diff --git "a/llm.mnn.json" "b/llm.mnn.json" new file mode 100644--- /dev/null +++ "b/llm.mnn.json" @@ -0,0 +1,31130 @@ + +{ "bizCode": "MNNTest", "extraInfo": +{ "version": "3.4.0" } +, "oplists": +[ +{ "main_type": "Input", "main": +{ "dims": +[ 1, 1, 4096 ] +, "dtype": "DT_FLOAT", "dformat": "NCHW" } +, "name": "input_ids", "outputIndexes": +[ 2 ] +, "type": "Input", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Input", "main": +{ "dims": +[ 1, 1, -1, -1 ] +, "dtype": "DT_FLOAT", "dformat": "NCHW" } +, "name": "attention_mask", "outputIndexes": +[ 124 ] +, "type": "Input", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Input", "main": +{ "dims": +[ 1, -1 ] +, "dtype": "DT_INT32", "dformat": "NCHW" } +, "name": "position_ids", "outputIndexes": +[ 0 ] +, "type": "Input", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Input", "main": +{ "dims": +[ 1 ] +, "dtype": "DT_INT32", "dformat": "NCHW" } +, "name": "logits_index", "outputIndexes": +[ 1 ] +, "type": "Input", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 3 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 1, -1, 4096 ] + } +, "name": "/blocks.0/Constant_output_0", "outputIndexes": +[ 3 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.0/Reshape_output_0", "outputIndexes": +[ 4 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 4 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 0, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.0/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 5 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 5 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 2897 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2897 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.0/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 2898 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2898 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 32768, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.0/self_attn/q_proj/Linear", "outputIndexes": +[ 2899 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2899 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 2900 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2900 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 6 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 5 ] +, "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_output_0", "outputIndexes": +[ 7 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 7 ] +, "main_type": "NONE", "name": "Shape21", "outputIndexes": +[ 8 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 7 ] +, "main_type": "NONE", "name": "Rank23", "outputIndexes": +[ 9 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 9, 9 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp25", "outputIndexes": +[ 10 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 10 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze26", "outputIndexes": +[ 11 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 1 ] + } +, "name": "Const27", "outputIndexes": +[ 12 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 10, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp28", "outputIndexes": +[ 13 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 13 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze29", "outputIndexes": +[ 14 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 1 ] + } +, "name": "Unsqueeze31", "outputIndexes": +[ 15 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 8, 11, 14, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice32", "outputIndexes": +[ 16 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze33", "outputIndexes": +[ 17 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 17, 17 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp35", "outputIndexes": +[ 18 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 7, 18, 10 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_output_0", "outputIndexes": +[ 19 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 0 ] + } +, "name": "/rotary/Constant_3_output_0", "outputIndexes": +[ 20 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 19, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 21 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 10 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze45", "outputIndexes": +[ 22 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 13 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze48", "outputIndexes": +[ 23 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 8, 22, 23, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice51", "outputIndexes": +[ 24 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze52", "outputIndexes": +[ 25 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 25 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp53", "outputIndexes": +[ 26 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 26, 25 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp54", "outputIndexes": +[ 27 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 7, 27, 10 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_1_output_0", "outputIndexes": +[ 28 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 28, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 29 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 32 ] + } +, "name": "/blocks.0/self_attn/Constant_2_output_0", "outputIndexes": +[ 30 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 128 ] + } +, "name": "/blocks.0/self_attn/Constant_3_output_0", "outputIndexes": +[ 31 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 21, 29, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.0/self_attn/Concat_output_0", "outputIndexes": +[ 32 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 6, 32 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.0/self_attn/Reshape_output_0", "outputIndexes": +[ 33 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 0 ] +, "main_type": "CastParam", "main": +{ "srcT": "DT_VARIANT", "dstT": "DT_FLOAT" } +, "name": "/rotary/Cast_output_0", "outputIndexes": +[ 34 ] +, "type": "Cast", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 2 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ -1, 1 ] + } +, "name": "/rotary/Constant_output_0", "outputIndexes": +[ 35 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 34, 35 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/rotary/Reshape_output_0", "outputIndexes": +[ 36 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 64 ] +, "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": +[ 1.0, 0.814617, 0.663601, 0.540581, 0.440367, 0.35873, 0.292228, 0.238054, 0.193923, 0.157973, 0.128687, 0.104831, 0.085397, 0.069566, 0.05667, 0.046164, 0.037606, 0.030635, 0.024955, 0.020329, 0.01656, 0.01349, 0.01099, 0.008952, 0.007293, 0.005941, 0.004839, 0.003942, 0.003211, 0.002616, 0.002131, 0.001736, 0.001414, 0.001152, 0.000938, 0.000764, 0.000623, 0.000507, 0.000413, 0.000337, 0.000274, 0.000223, 0.000182, 0.000148, 0.000121, 0.000098, 0.00008, 0.000065, 0.000053, 0.000043, 0.000035, 0.000029, 0.000023, 0.000019, 0.000016, 0.000013, 0.00001, 0.000008, 0.000007, 0.000006, 0.000005, 0.000004, 0.000003, 0.000002 ] + } +, "name": "/rotary/Constant_1_output_0", "outputIndexes": +[ 37 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 36, 37 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/rotary/Mul_output_0", "outputIndexes": +[ 38 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 38 ] +, "main_type": "UnaryOp", "main": +{ "opType": "COS", "T": "DT_FLOAT" } +, "name": "/rotary/Cos_output_0", "outputIndexes": +[ 39 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 39, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/rotary/Unsqueeze_output_0", "outputIndexes": +[ 40 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 38 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SIN", "T": "DT_FLOAT" } +, "name": "/rotary/Sin_output_0", "outputIndexes": +[ 41 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 41, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/rotary/Unsqueeze_1_output_0", "outputIndexes": +[ 42 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 40, 42 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/rotary/Concat_output_0", "outputIndexes": +[ 43 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 43, 43 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/rotary/Concat_1_output_0", "outputIndexes": +[ 44 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 2 ] + } +, "name": "/rotary/Constant_5_output_0", "outputIndexes": +[ 45 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 44, 45 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/rotary/Unsqueeze_2_output_0", "outputIndexes": +[ 46 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 46, 15 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/rotary/Unsqueeze_3_output_0", "outputIndexes": +[ 47 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 47 ] +, "main_type": "NONE", "name": "Shape76", "outputIndexes": +[ 48 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 47 ] +, "main_type": "NONE", "name": "Rank78", "outputIndexes": +[ 49 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 49, 49 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp80", "outputIndexes": +[ 50 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 50 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze81", "outputIndexes": +[ 51 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 50, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp83", "outputIndexes": +[ 52 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 52 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze84", "outputIndexes": +[ 53 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 48, 51, 53, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice87", "outputIndexes": +[ 54 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 54 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze88", "outputIndexes": +[ 55 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 55, 55 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp90", "outputIndexes": +[ 56 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 47, 56, 50 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_2_output_0", "outputIndexes": +[ 57 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 33, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Mul_output_0", "outputIndexes": +[ 58 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 33 ] +, "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_2_output_0", "outputIndexes": +[ 59 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 3 ] + } +, "name": "/blocks.0/self_attn/Constant_8_output_0", "outputIndexes": +[ 60 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 59 ] +, "main_type": "NONE", "name": "Shape95", "outputIndexes": +[ 61 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 59 ] +, "main_type": "NONE", "name": "Rank97", "outputIndexes": +[ 62 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 62, 62 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp99", "outputIndexes": +[ 63 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 63 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze100", "outputIndexes": +[ 64 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 63, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp102", "outputIndexes": +[ 65 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 65 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze103", "outputIndexes": +[ 66 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 61, 64, 66, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice106", "outputIndexes": +[ 67 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 67 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze107", "outputIndexes": +[ 68 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 68 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp108", "outputIndexes": +[ 69 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 69, 68 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp109", "outputIndexes": +[ 70 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 59, 70, 63 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_4_output_0", "outputIndexes": +[ 71 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 2 ] + } +, "name": "/blocks.0/self_attn/Constant_9_output_0", "outputIndexes": +[ 72 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 71, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Div_output_0", "outputIndexes": +[ 73 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 73, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 74 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 1073741824 ] + } +, "name": "/blocks.0/self_attn/Constant_16_output_0", "outputIndexes": +[ 75 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 3 ] + } +, "name": "/blocks.0/self_attn/Constant_10_output_0", "outputIndexes": +[ 76 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 33, 74, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.0/self_attn/Slice_1_output_0", "outputIndexes": +[ 77 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 77 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.0/self_attn/Neg_output_0", "outputIndexes": +[ 78 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 73, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 79 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 33, 20, 79, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.0/self_attn/Slice_output_0", "outputIndexes": +[ 80 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 78, 80 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.0/self_attn/Concat_3_output_0", "outputIndexes": +[ 81 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 50 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze127", "outputIndexes": +[ 82 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 52 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze130", "outputIndexes": +[ 83 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 48, 82, 83, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice133", "outputIndexes": +[ 84 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 84 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze134", "outputIndexes": +[ 85 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 85 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp135", "outputIndexes": +[ 86 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 86, 85 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp136", "outputIndexes": +[ 87 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 47, 87, 50 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_3_output_0", "outputIndexes": +[ 88 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 81, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Mul_1_output_0", "outputIndexes": +[ 89 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 58, 89 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Add_output_0", "outputIndexes": +[ 90 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2898 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 9469974, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.0/self_attn/k_proj/Linear", "outputIndexes": +[ 2903 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2903 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 2904 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2904 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 91 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 19, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 92 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 28, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 93 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 8 ] + } +, "name": "/blocks.0/self_attn/Constant_4_output_0", "outputIndexes": +[ 94 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 92, 93, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.0/self_attn/Concat_1_output_0", "outputIndexes": +[ 95 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 91, 95 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.0/self_attn/Reshape_1_output_0", "outputIndexes": +[ 96 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 96, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Mul_2_output_0", "outputIndexes": +[ 97 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 96 ] +, "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_3_output_0", "outputIndexes": +[ 98 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 98 ] +, "main_type": "NONE", "name": "Shape148", "outputIndexes": +[ 99 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 98 ] +, "main_type": "NONE", "name": "Rank150", "outputIndexes": +[ 100 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 100, 100 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp152", "outputIndexes": +[ 101 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 101 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze153", "outputIndexes": +[ 102 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 101, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp155", "outputIndexes": +[ 103 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 103 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze156", "outputIndexes": +[ 104 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 99, 102, 104, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice159", "outputIndexes": +[ 105 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 105 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze160", "outputIndexes": +[ 106 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 106 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp161", "outputIndexes": +[ 107 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 107, 106 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp162", "outputIndexes": +[ 108 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 98, 108, 101 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_5_output_0", "outputIndexes": +[ 109 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 109, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Div_1_output_0", "outputIndexes": +[ 110 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 110, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 111 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 96, 111, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.0/self_attn/Slice_3_output_0", "outputIndexes": +[ 112 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 112 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.0/self_attn/Neg_1_output_0", "outputIndexes": +[ 113 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 110, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 114 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 96, 20, 114, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.0/self_attn/Slice_2_output_0", "outputIndexes": +[ 115 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 113, 115 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.0/self_attn/Concat_4_output_0", "outputIndexes": +[ 116 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 116, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Mul_3_output_0", "outputIndexes": +[ 117 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 97, 117 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Add_1_output_0", "outputIndexes": +[ 118 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2898 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 11829292, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.0/self_attn/v_proj/Linear", "outputIndexes": +[ 2907 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2907 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 2908 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2908 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 119 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 19, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 120 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 28, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 121 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 120, 121, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.0/self_attn/Concat_2_output_0", "outputIndexes": +[ 122 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 119, 122 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.0/self_attn/Reshape_2_output_0", "outputIndexes": +[ 123 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 90, 118, 123, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.0/self_attn/FusedAttention", "outputIndexes": +[ 125 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 125 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 2909 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2909 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.0/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 2910 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2910 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 14188610, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.0/self_attn/o_proj/Linear", "outputIndexes": +[ 2911 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2911 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 2912 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2912 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 126 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 4, 126 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/Add_output_0", "outputIndexes": +[ 127 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 127 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 23625816, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.0/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 128 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 128 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.0/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 2913 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2913 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.0/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 2914 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2914 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 23658584, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.0/mlp/gate_proj/Linear", "outputIndexes": +[ 2915 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2915 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 2916 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2916 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.0/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 129 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 129 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.0/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 130 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2914 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 56688750, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.0/mlp/up_proj/Linear", "outputIndexes": +[ 2919 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2919 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 2920 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2920 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.0/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 131 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 130, 131 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/mlp/Mul_output_0", "outputIndexes": +[ 132 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.0/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 2921 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2921 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.0/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 2922 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2922 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 89718916, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.0/mlp/down_proj/Linear", "outputIndexes": +[ 2923 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2923 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 2924 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2924 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.0/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 133 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 127, 133 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/Add_1_output_0", "outputIndexes": +[ 134 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.1/Reshape_output_0", "outputIndexes": +[ 135 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 135 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 122749082, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.1/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 136 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 2925 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2925 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.1/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 2926 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2926 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 122781850, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.1/self_attn/q_proj/Linear", "outputIndexes": +[ 2927 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2927 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 2928 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2928 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 137 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_output_0", "outputIndexes": +[ 138 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 138 ] +, "main_type": "NONE", "name": "Shape209", "outputIndexes": +[ 139 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 138 ] +, "main_type": "NONE", "name": "Rank211", "outputIndexes": +[ 140 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 140, 140 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp213", "outputIndexes": +[ 141 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 141 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze214", "outputIndexes": +[ 142 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 141, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp216", "outputIndexes": +[ 143 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 143 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze217", "outputIndexes": +[ 144 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 139, 142, 144, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice220", "outputIndexes": +[ 145 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 145 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze221", "outputIndexes": +[ 146 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 146, 146 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp223", "outputIndexes": +[ 147 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 138, 147, 141 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.1/self_attn/Gather_output_0", "outputIndexes": +[ 148 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 149 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 141 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze231", "outputIndexes": +[ 150 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 143 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze234", "outputIndexes": +[ 151 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 139, 150, 151, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice237", "outputIndexes": +[ 152 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze238", "outputIndexes": +[ 153 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 153 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp239", "outputIndexes": +[ 154 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 154, 153 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp240", "outputIndexes": +[ 155 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 138, 155, 141 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.1/self_attn/Gather_1_output_0", "outputIndexes": +[ 156 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 156, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 157 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 149, 157, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.1/self_attn/Concat_output_0", "outputIndexes": +[ 158 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 137, 158 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.1/self_attn/Reshape_output_0", "outputIndexes": +[ 159 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 159, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Mul_output_0", "outputIndexes": +[ 160 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 159 ] +, "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_2_output_0", "outputIndexes": +[ 161 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 161 ] +, "main_type": "NONE", "name": "Shape247", "outputIndexes": +[ 162 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 161 ] +, "main_type": "NONE", "name": "Rank249", "outputIndexes": +[ 163 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 163, 163 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp251", "outputIndexes": +[ 164 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 164 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze252", "outputIndexes": +[ 165 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 164, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp254", "outputIndexes": +[ 166 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 166 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze255", "outputIndexes": +[ 167 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 162, 165, 167, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice258", "outputIndexes": +[ 168 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 168 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze259", "outputIndexes": +[ 169 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 169 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp260", "outputIndexes": +[ 170 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 170, 169 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp261", "outputIndexes": +[ 171 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 161, 171, 164 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.1/self_attn/Gather_2_output_0", "outputIndexes": +[ 172 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 172, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Div_output_0", "outputIndexes": +[ 173 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 173, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 174 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 159, 174, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.1/self_attn/Slice_1_output_0", "outputIndexes": +[ 175 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 175 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.1/self_attn/Neg_output_0", "outputIndexes": +[ 176 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 173, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 177 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 159, 20, 177, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.1/self_attn/Slice_output_0", "outputIndexes": +[ 178 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 176, 178 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.1/self_attn/Concat_3_output_0", "outputIndexes": +[ 179 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 179, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Mul_1_output_0", "outputIndexes": +[ 180 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 160, 180 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Add_output_0", "outputIndexes": +[ 181 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2926 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 132219056, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.1/self_attn/k_proj/Linear", "outputIndexes": +[ 2931 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2931 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 2932 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2932 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 182 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 183 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 156, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 184 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 183, 184, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.1/self_attn/Concat_1_output_0", "outputIndexes": +[ 185 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 182, 185 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.1/self_attn/Reshape_1_output_0", "outputIndexes": +[ 186 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 186, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Mul_2_output_0", "outputIndexes": +[ 187 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 186 ] +, "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_3_output_0", "outputIndexes": +[ 188 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 188 ] +, "main_type": "NONE", "name": "Shape280", "outputIndexes": +[ 189 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 188 ] +, "main_type": "NONE", "name": "Rank282", "outputIndexes": +[ 190 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 190, 190 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp284", "outputIndexes": +[ 191 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 191 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze285", "outputIndexes": +[ 192 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 191, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp287", "outputIndexes": +[ 193 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 193 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze288", "outputIndexes": +[ 194 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 189, 192, 194, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice291", "outputIndexes": +[ 195 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 195 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze292", "outputIndexes": +[ 196 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 196 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp293", "outputIndexes": +[ 197 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 197, 196 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp294", "outputIndexes": +[ 198 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 188, 198, 191 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.1/self_attn/Gather_3_output_0", "outputIndexes": +[ 199 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 199, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Div_1_output_0", "outputIndexes": +[ 200 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 200, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 201 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 186, 201, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.1/self_attn/Slice_3_output_0", "outputIndexes": +[ 202 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 202 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.1/self_attn/Neg_1_output_0", "outputIndexes": +[ 203 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 200, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 204 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 186, 20, 204, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.1/self_attn/Slice_2_output_0", "outputIndexes": +[ 205 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 203, 205 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.1/self_attn/Concat_4_output_0", "outputIndexes": +[ 206 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 206, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Mul_3_output_0", "outputIndexes": +[ 207 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 187, 207 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Add_1_output_0", "outputIndexes": +[ 208 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2926 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 134578374, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.1/self_attn/v_proj/Linear", "outputIndexes": +[ 2935 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2935 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 2936 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2936 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 209 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 210 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 156, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 211 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 210, 211, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.1/self_attn/Concat_2_output_0", "outputIndexes": +[ 212 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 209, 212 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.1/self_attn/Reshape_2_output_0", "outputIndexes": +[ 213 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 181, 208, 213, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.1/self_attn/FusedAttention", "outputIndexes": +[ 214 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 214 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 2937 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2937 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.1/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 2938 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2938 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 136937692, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.1/self_attn/o_proj/Linear", "outputIndexes": +[ 2939 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2939 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 2940 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2940 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 215 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 135, 215 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/Add_output_0", "outputIndexes": +[ 216 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 216 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 146374898, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.1/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 217 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 217 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.1/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 2941 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2941 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.1/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 2942 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2942 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 146407666, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.1/mlp/gate_proj/Linear", "outputIndexes": +[ 2943 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2943 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 2944 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2944 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.1/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 218 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 218 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.1/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 219 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2942 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 179437832, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.1/mlp/up_proj/Linear", "outputIndexes": +[ 2947 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2947 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 2948 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2948 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.1/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 220 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 219, 220 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/mlp/Mul_output_0", "outputIndexes": +[ 221 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 221 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.1/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 2949 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2949 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.1/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 2950 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2950 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 212467998, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.1/mlp/down_proj/Linear", "outputIndexes": +[ 2951 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2951 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 2952 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2952 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.1/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 222 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 216, 222 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/Add_1_output_0", "outputIndexes": +[ 223 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 223, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.2/Reshape_output_0", "outputIndexes": +[ 224 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 224 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 245498164, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.2/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 225 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 225 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 2953 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2953 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.2/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 2954 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2954 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 245530932, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.2/self_attn/q_proj/Linear", "outputIndexes": +[ 2955 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2955 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 2956 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2956 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 226 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 225 ] +, "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_output_0", "outputIndexes": +[ 227 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 227 ] +, "main_type": "NONE", "name": "Shape340", "outputIndexes": +[ 228 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 227 ] +, "main_type": "NONE", "name": "Rank342", "outputIndexes": +[ 229 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 229, 229 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp344", "outputIndexes": +[ 230 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 230 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze345", "outputIndexes": +[ 231 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 230, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp347", "outputIndexes": +[ 232 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 232 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze348", "outputIndexes": +[ 233 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 228, 231, 233, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice351", "outputIndexes": +[ 234 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 234 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze352", "outputIndexes": +[ 235 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 235, 235 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp354", "outputIndexes": +[ 236 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 227, 236, 230 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.2/self_attn/Gather_output_0", "outputIndexes": +[ 237 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 237, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 238 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 230 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze362", "outputIndexes": +[ 239 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 232 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze365", "outputIndexes": +[ 240 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 228, 239, 240, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice368", "outputIndexes": +[ 241 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 241 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze369", "outputIndexes": +[ 242 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 242 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp370", "outputIndexes": +[ 243 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 243, 242 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp371", "outputIndexes": +[ 244 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 227, 244, 230 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.2/self_attn/Gather_1_output_0", "outputIndexes": +[ 245 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 245, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 246 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 238, 246, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.2/self_attn/Concat_output_0", "outputIndexes": +[ 247 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 226, 247 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.2/self_attn/Reshape_output_0", "outputIndexes": +[ 248 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 248, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Mul_output_0", "outputIndexes": +[ 249 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 248 ] +, "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_2_output_0", "outputIndexes": +[ 250 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 250 ] +, "main_type": "NONE", "name": "Shape378", "outputIndexes": +[ 251 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 250 ] +, "main_type": "NONE", "name": "Rank380", "outputIndexes": +[ 252 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 252, 252 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp382", "outputIndexes": +[ 253 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 253 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze383", "outputIndexes": +[ 254 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 253, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp385", "outputIndexes": +[ 255 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 255 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze386", "outputIndexes": +[ 256 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 251, 254, 256, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice389", "outputIndexes": +[ 257 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 257 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze390", "outputIndexes": +[ 258 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 258 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp391", "outputIndexes": +[ 259 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 259, 258 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp392", "outputIndexes": +[ 260 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 250, 260, 253 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.2/self_attn/Gather_2_output_0", "outputIndexes": +[ 261 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 261, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Div_output_0", "outputIndexes": +[ 262 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 262, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 263 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 248, 263, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.2/self_attn/Slice_1_output_0", "outputIndexes": +[ 264 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 264 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.2/self_attn/Neg_output_0", "outputIndexes": +[ 265 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 262, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 266 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 248, 20, 266, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.2/self_attn/Slice_output_0", "outputIndexes": +[ 267 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 265, 267 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.2/self_attn/Concat_3_output_0", "outputIndexes": +[ 268 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 268, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Mul_1_output_0", "outputIndexes": +[ 269 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 249, 269 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Add_output_0", "outputIndexes": +[ 270 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2954 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 254968138, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.2/self_attn/k_proj/Linear", "outputIndexes": +[ 2959 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2959 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 2960 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2960 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 271 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 237, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 272 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 245, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 273 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 272, 273, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.2/self_attn/Concat_1_output_0", "outputIndexes": +[ 274 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 271, 274 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.2/self_attn/Reshape_1_output_0", "outputIndexes": +[ 275 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 275, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Mul_2_output_0", "outputIndexes": +[ 276 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 275 ] +, "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_3_output_0", "outputIndexes": +[ 277 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 277 ] +, "main_type": "NONE", "name": "Shape411", "outputIndexes": +[ 278 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 277 ] +, "main_type": "NONE", "name": "Rank413", "outputIndexes": +[ 279 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 279, 279 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp415", "outputIndexes": +[ 280 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 280 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze416", "outputIndexes": +[ 281 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 280, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp418", "outputIndexes": +[ 282 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 282 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze419", "outputIndexes": +[ 283 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 278, 281, 283, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice422", "outputIndexes": +[ 284 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 284 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze423", "outputIndexes": +[ 285 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 285 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp424", "outputIndexes": +[ 286 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 286, 285 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp425", "outputIndexes": +[ 287 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 277, 287, 280 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.2/self_attn/Gather_3_output_0", "outputIndexes": +[ 288 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 288, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Div_1_output_0", "outputIndexes": +[ 289 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 289, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 290 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 275, 290, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.2/self_attn/Slice_3_output_0", "outputIndexes": +[ 291 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 291 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.2/self_attn/Neg_1_output_0", "outputIndexes": +[ 292 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 289, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 293 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 275, 20, 293, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.2/self_attn/Slice_2_output_0", "outputIndexes": +[ 294 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 292, 294 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.2/self_attn/Concat_4_output_0", "outputIndexes": +[ 295 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 295, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Mul_3_output_0", "outputIndexes": +[ 296 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 276, 296 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Add_1_output_0", "outputIndexes": +[ 297 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2954 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 257327456, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.2/self_attn/v_proj/Linear", "outputIndexes": +[ 2963 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2963 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 2964 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2964 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 298 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 237, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 299 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 245, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 300 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 299, 300, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.2/self_attn/Concat_2_output_0", "outputIndexes": +[ 301 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 298, 301 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.2/self_attn/Reshape_2_output_0", "outputIndexes": +[ 302 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 270, 297, 302, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.2/self_attn/FusedAttention", "outputIndexes": +[ 303 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 303 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 2965 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2965 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.2/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 2966 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2966 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 259686774, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.2/self_attn/o_proj/Linear", "outputIndexes": +[ 2967 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2967 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 2968 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2968 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 304 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 224, 304 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/Add_output_0", "outputIndexes": +[ 305 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 305 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 269123980, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.2/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 306 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 306 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.2/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 2969 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2969 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.2/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 2970 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2970 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 269156748, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.2/mlp/gate_proj/Linear", "outputIndexes": +[ 2971 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2971 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 2972 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2972 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.2/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 307 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 307 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.2/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 308 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2970 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 302186914, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.2/mlp/up_proj/Linear", "outputIndexes": +[ 2975 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2975 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 2976 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2976 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.2/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 309 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 308, 309 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/mlp/Mul_output_0", "outputIndexes": +[ 310 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 310 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.2/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 2977 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2977 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.2/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 2978 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2978 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 335217080, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.2/mlp/down_proj/Linear", "outputIndexes": +[ 2979 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2979 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 2980 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2980 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.2/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 311 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 305, 311 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/Add_1_output_0", "outputIndexes": +[ 312 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 312, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.3/Reshape_output_0", "outputIndexes": +[ 313 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 313 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 368247246, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.3/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 314 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 314 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 2981 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2981 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.3/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 2982 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2982 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 368280014, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.3/self_attn/q_proj/Linear", "outputIndexes": +[ 2983 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2983 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 2984 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2984 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 315 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 314 ] +, "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_output_0", "outputIndexes": +[ 316 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 316 ] +, "main_type": "NONE", "name": "Shape471", "outputIndexes": +[ 317 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 316 ] +, "main_type": "NONE", "name": "Rank473", "outputIndexes": +[ 318 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 318, 318 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp475", "outputIndexes": +[ 319 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 319 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze476", "outputIndexes": +[ 320 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 319, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp478", "outputIndexes": +[ 321 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 321 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze479", "outputIndexes": +[ 322 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 317, 320, 322, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice482", "outputIndexes": +[ 323 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 323 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze483", "outputIndexes": +[ 324 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 324, 324 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp485", "outputIndexes": +[ 325 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 316, 325, 319 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.3/self_attn/Gather_output_0", "outputIndexes": +[ 326 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 326, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 327 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 319 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze493", "outputIndexes": +[ 328 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 321 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze496", "outputIndexes": +[ 329 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 317, 328, 329, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice499", "outputIndexes": +[ 330 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 330 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze500", "outputIndexes": +[ 331 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 331 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp501", "outputIndexes": +[ 332 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 332, 331 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp502", "outputIndexes": +[ 333 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 316, 333, 319 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.3/self_attn/Gather_1_output_0", "outputIndexes": +[ 334 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 334, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 335 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 327, 335, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.3/self_attn/Concat_output_0", "outputIndexes": +[ 336 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 315, 336 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.3/self_attn/Reshape_output_0", "outputIndexes": +[ 337 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 337, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Mul_output_0", "outputIndexes": +[ 338 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 337 ] +, "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_2_output_0", "outputIndexes": +[ 339 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 339 ] +, "main_type": "NONE", "name": "Shape509", "outputIndexes": +[ 340 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 339 ] +, "main_type": "NONE", "name": "Rank511", "outputIndexes": +[ 341 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 341, 341 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp513", "outputIndexes": +[ 342 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 342 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze514", "outputIndexes": +[ 343 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 342, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp516", "outputIndexes": +[ 344 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 344 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze517", "outputIndexes": +[ 345 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 340, 343, 345, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice520", "outputIndexes": +[ 346 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 346 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze521", "outputIndexes": +[ 347 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 347 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp522", "outputIndexes": +[ 348 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 348, 347 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp523", "outputIndexes": +[ 349 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 339, 349, 342 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.3/self_attn/Gather_2_output_0", "outputIndexes": +[ 350 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 350, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Div_output_0", "outputIndexes": +[ 351 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 351, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 352 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 337, 352, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.3/self_attn/Slice_1_output_0", "outputIndexes": +[ 353 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 353 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.3/self_attn/Neg_output_0", "outputIndexes": +[ 354 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 351, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 355 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 337, 20, 355, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.3/self_attn/Slice_output_0", "outputIndexes": +[ 356 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 354, 356 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.3/self_attn/Concat_3_output_0", "outputIndexes": +[ 357 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 357, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Mul_1_output_0", "outputIndexes": +[ 358 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 338, 358 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Add_output_0", "outputIndexes": +[ 359 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2982 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 377717220, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.3/self_attn/k_proj/Linear", "outputIndexes": +[ 2987 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2987 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 2988 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2988 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 360 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 326, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 361 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 334, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 362 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 361, 362, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.3/self_attn/Concat_1_output_0", "outputIndexes": +[ 363 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 360, 363 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.3/self_attn/Reshape_1_output_0", "outputIndexes": +[ 364 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 364, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Mul_2_output_0", "outputIndexes": +[ 365 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 364 ] +, "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_3_output_0", "outputIndexes": +[ 366 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 366 ] +, "main_type": "NONE", "name": "Shape542", "outputIndexes": +[ 367 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 366 ] +, "main_type": "NONE", "name": "Rank544", "outputIndexes": +[ 368 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 368, 368 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp546", "outputIndexes": +[ 369 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 369 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze547", "outputIndexes": +[ 370 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 369, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp549", "outputIndexes": +[ 371 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 371 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze550", "outputIndexes": +[ 372 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 367, 370, 372, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice553", "outputIndexes": +[ 373 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 373 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze554", "outputIndexes": +[ 374 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 374 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp555", "outputIndexes": +[ 375 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 375, 374 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp556", "outputIndexes": +[ 376 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 366, 376, 369 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.3/self_attn/Gather_3_output_0", "outputIndexes": +[ 377 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 377, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Div_1_output_0", "outputIndexes": +[ 378 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 378, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 379 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 364, 379, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.3/self_attn/Slice_3_output_0", "outputIndexes": +[ 380 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 380 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.3/self_attn/Neg_1_output_0", "outputIndexes": +[ 381 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 378, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 382 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 364, 20, 382, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.3/self_attn/Slice_2_output_0", "outputIndexes": +[ 383 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 381, 383 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.3/self_attn/Concat_4_output_0", "outputIndexes": +[ 384 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 384, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Mul_3_output_0", "outputIndexes": +[ 385 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 365, 385 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Add_1_output_0", "outputIndexes": +[ 386 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2982 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 380076538, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.3/self_attn/v_proj/Linear", "outputIndexes": +[ 2991 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2991 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 2992 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2992 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 387 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 326, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 388 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 334, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 389 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 388, 389, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.3/self_attn/Concat_2_output_0", "outputIndexes": +[ 390 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 387, 390 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.3/self_attn/Reshape_2_output_0", "outputIndexes": +[ 391 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 359, 386, 391, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.3/self_attn/FusedAttention", "outputIndexes": +[ 392 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 392 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 2993 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2993 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.3/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 2994 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2994 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 382435856, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.3/self_attn/o_proj/Linear", "outputIndexes": +[ 2995 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2995 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 2996 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2996 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 393 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 313, 393 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/Add_output_0", "outputIndexes": +[ 394 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 394 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 391873062, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.3/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 395 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 395 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.3/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 2997 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2997 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.3/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 2998 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2998 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 391905830, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.3/mlp/gate_proj/Linear", "outputIndexes": +[ 2999 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2999 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3000 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3000 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.3/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 396 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 396 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.3/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 397 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2998 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 424935996, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.3/mlp/up_proj/Linear", "outputIndexes": +[ 3003 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3003 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3004 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3004 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.3/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 398 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 397, 398 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/mlp/Mul_output_0", "outputIndexes": +[ 399 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 399 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.3/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3005 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3005 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.3/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3006 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3006 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 457966162, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.3/mlp/down_proj/Linear", "outputIndexes": +[ 3007 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3007 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3008 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3008 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.3/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 400 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 394, 400 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/Add_1_output_0", "outputIndexes": +[ 401 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 401, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.4/Reshape_output_0", "outputIndexes": +[ 402 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 402 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 490996328, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.4/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 403 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 403 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3009 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3009 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.4/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3010 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3010 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 491029096, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.4/self_attn/q_proj/Linear", "outputIndexes": +[ 3011 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3011 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3012 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3012 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 404 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 403 ] +, "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_output_0", "outputIndexes": +[ 405 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 405 ] +, "main_type": "NONE", "name": "Shape602", "outputIndexes": +[ 406 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 405 ] +, "main_type": "NONE", "name": "Rank604", "outputIndexes": +[ 407 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 407, 407 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp606", "outputIndexes": +[ 408 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 408 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze607", "outputIndexes": +[ 409 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 408, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp609", "outputIndexes": +[ 410 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 410 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze610", "outputIndexes": +[ 411 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 406, 409, 411, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice613", "outputIndexes": +[ 412 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 412 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze614", "outputIndexes": +[ 413 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 413, 413 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp616", "outputIndexes": +[ 414 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 405, 414, 408 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.4/self_attn/Gather_output_0", "outputIndexes": +[ 415 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 415, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 416 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 408 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze624", "outputIndexes": +[ 417 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 410 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze627", "outputIndexes": +[ 418 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 406, 417, 418, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice630", "outputIndexes": +[ 419 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 419 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze631", "outputIndexes": +[ 420 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 420 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp632", "outputIndexes": +[ 421 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 421, 420 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp633", "outputIndexes": +[ 422 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 405, 422, 408 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.4/self_attn/Gather_1_output_0", "outputIndexes": +[ 423 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 423, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 424 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 416, 424, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.4/self_attn/Concat_output_0", "outputIndexes": +[ 425 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 404, 425 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.4/self_attn/Reshape_output_0", "outputIndexes": +[ 426 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 426, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Mul_output_0", "outputIndexes": +[ 427 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 426 ] +, "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_2_output_0", "outputIndexes": +[ 428 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 428 ] +, "main_type": "NONE", "name": "Shape640", "outputIndexes": +[ 429 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 428 ] +, "main_type": "NONE", "name": "Rank642", "outputIndexes": +[ 430 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 430, 430 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp644", "outputIndexes": +[ 431 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 431 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze645", "outputIndexes": +[ 432 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 431, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp647", "outputIndexes": +[ 433 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 433 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze648", "outputIndexes": +[ 434 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 429, 432, 434, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice651", "outputIndexes": +[ 435 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 435 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze652", "outputIndexes": +[ 436 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 436 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp653", "outputIndexes": +[ 437 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 437, 436 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp654", "outputIndexes": +[ 438 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 428, 438, 431 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.4/self_attn/Gather_2_output_0", "outputIndexes": +[ 439 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 439, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Div_output_0", "outputIndexes": +[ 440 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 440, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 441 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 426, 441, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.4/self_attn/Slice_1_output_0", "outputIndexes": +[ 442 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 442 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.4/self_attn/Neg_output_0", "outputIndexes": +[ 443 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 440, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 444 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 426, 20, 444, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.4/self_attn/Slice_output_0", "outputIndexes": +[ 445 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 443, 445 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.4/self_attn/Concat_3_output_0", "outputIndexes": +[ 446 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 446, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Mul_1_output_0", "outputIndexes": +[ 447 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 427, 447 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Add_output_0", "outputIndexes": +[ 448 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3010 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 500466302, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.4/self_attn/k_proj/Linear", "outputIndexes": +[ 3015 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3015 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3016 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3016 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 449 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 415, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 450 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 423, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 451 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 450, 451, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.4/self_attn/Concat_1_output_0", "outputIndexes": +[ 452 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 449, 452 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.4/self_attn/Reshape_1_output_0", "outputIndexes": +[ 453 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 453, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Mul_2_output_0", "outputIndexes": +[ 454 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 453 ] +, "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_3_output_0", "outputIndexes": +[ 455 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 455 ] +, "main_type": "NONE", "name": "Shape673", "outputIndexes": +[ 456 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 455 ] +, "main_type": "NONE", "name": "Rank675", "outputIndexes": +[ 457 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 457, 457 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp677", "outputIndexes": +[ 458 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 458 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze678", "outputIndexes": +[ 459 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 458, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp680", "outputIndexes": +[ 460 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 460 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze681", "outputIndexes": +[ 461 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 456, 459, 461, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice684", "outputIndexes": +[ 462 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 462 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze685", "outputIndexes": +[ 463 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 463 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp686", "outputIndexes": +[ 464 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 464, 463 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp687", "outputIndexes": +[ 465 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 455, 465, 458 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.4/self_attn/Gather_3_output_0", "outputIndexes": +[ 466 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 466, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Div_1_output_0", "outputIndexes": +[ 467 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 467, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 468 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 453, 468, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.4/self_attn/Slice_3_output_0", "outputIndexes": +[ 469 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 469 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.4/self_attn/Neg_1_output_0", "outputIndexes": +[ 470 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 467, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 471 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 453, 20, 471, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.4/self_attn/Slice_2_output_0", "outputIndexes": +[ 472 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 470, 472 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.4/self_attn/Concat_4_output_0", "outputIndexes": +[ 473 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 473, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Mul_3_output_0", "outputIndexes": +[ 474 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 454, 474 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Add_1_output_0", "outputIndexes": +[ 475 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3010 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 502825620, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.4/self_attn/v_proj/Linear", "outputIndexes": +[ 3019 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3019 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3020 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3020 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 476 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 415, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 477 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 423, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 478 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 477, 478, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.4/self_attn/Concat_2_output_0", "outputIndexes": +[ 479 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 476, 479 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.4/self_attn/Reshape_2_output_0", "outputIndexes": +[ 480 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 448, 475, 480, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.4/self_attn/FusedAttention", "outputIndexes": +[ 481 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 481 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3021 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3021 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.4/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3022 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3022 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 505184938, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.4/self_attn/o_proj/Linear", "outputIndexes": +[ 3023 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3023 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3024 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3024 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 482 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 402, 482 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/Add_output_0", "outputIndexes": +[ 483 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 483 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 514622144, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.4/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 484 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 484 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.4/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3025 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3025 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.4/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3026 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3026 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 514654912, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.4/mlp/gate_proj/Linear", "outputIndexes": +[ 3027 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3027 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3028 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3028 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.4/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 485 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 485 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.4/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 486 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3026 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 547685078, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.4/mlp/up_proj/Linear", "outputIndexes": +[ 3031 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3031 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3032 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3032 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.4/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 487 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 486, 487 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/mlp/Mul_output_0", "outputIndexes": +[ 488 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 488 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.4/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3033 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3033 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.4/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3034 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3034 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 580715244, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.4/mlp/down_proj/Linear", "outputIndexes": +[ 3035 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3035 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3036 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3036 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.4/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 489 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 483, 489 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/Add_1_output_0", "outputIndexes": +[ 490 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 490, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.5/Reshape_output_0", "outputIndexes": +[ 491 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 491 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 613745410, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.5/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 492 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 492 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3037 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3037 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.5/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3038 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3038 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 613778178, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.5/self_attn/q_proj/Linear", "outputIndexes": +[ 3039 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3039 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3040 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3040 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 493 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 492 ] +, "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_output_0", "outputIndexes": +[ 494 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 494 ] +, "main_type": "NONE", "name": "Shape733", "outputIndexes": +[ 495 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 494 ] +, "main_type": "NONE", "name": "Rank735", "outputIndexes": +[ 496 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 496, 496 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp737", "outputIndexes": +[ 497 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 497 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze738", "outputIndexes": +[ 498 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 497, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp740", "outputIndexes": +[ 499 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 499 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze741", "outputIndexes": +[ 500 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 495, 498, 500, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice744", "outputIndexes": +[ 501 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 501 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze745", "outputIndexes": +[ 502 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 502, 502 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp747", "outputIndexes": +[ 503 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 494, 503, 497 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.5/self_attn/Gather_output_0", "outputIndexes": +[ 504 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 504, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 505 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 497 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze755", "outputIndexes": +[ 506 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 499 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze758", "outputIndexes": +[ 507 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 495, 506, 507, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice761", "outputIndexes": +[ 508 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 508 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze762", "outputIndexes": +[ 509 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 509 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp763", "outputIndexes": +[ 510 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 510, 509 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp764", "outputIndexes": +[ 511 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 494, 511, 497 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.5/self_attn/Gather_1_output_0", "outputIndexes": +[ 512 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 512, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 513 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 505, 513, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.5/self_attn/Concat_output_0", "outputIndexes": +[ 514 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 493, 514 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.5/self_attn/Reshape_output_0", "outputIndexes": +[ 515 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 515, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Mul_output_0", "outputIndexes": +[ 516 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 515 ] +, "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_2_output_0", "outputIndexes": +[ 517 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 517 ] +, "main_type": "NONE", "name": "Shape771", "outputIndexes": +[ 518 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 517 ] +, "main_type": "NONE", "name": "Rank773", "outputIndexes": +[ 519 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 519, 519 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp775", "outputIndexes": +[ 520 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 520 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze776", "outputIndexes": +[ 521 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 520, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp778", "outputIndexes": +[ 522 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 522 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze779", "outputIndexes": +[ 523 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 518, 521, 523, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice782", "outputIndexes": +[ 524 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 524 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze783", "outputIndexes": +[ 525 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 525 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp784", "outputIndexes": +[ 526 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 526, 525 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp785", "outputIndexes": +[ 527 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 517, 527, 520 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.5/self_attn/Gather_2_output_0", "outputIndexes": +[ 528 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 528, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Div_output_0", "outputIndexes": +[ 529 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 529, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 530 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 515, 530, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.5/self_attn/Slice_1_output_0", "outputIndexes": +[ 531 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 531 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.5/self_attn/Neg_output_0", "outputIndexes": +[ 532 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 529, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 533 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 515, 20, 533, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.5/self_attn/Slice_output_0", "outputIndexes": +[ 534 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 532, 534 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.5/self_attn/Concat_3_output_0", "outputIndexes": +[ 535 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 535, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Mul_1_output_0", "outputIndexes": +[ 536 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 516, 536 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Add_output_0", "outputIndexes": +[ 537 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3038 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 623215384, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.5/self_attn/k_proj/Linear", "outputIndexes": +[ 3043 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3043 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3044 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3044 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 538 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 504, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 539 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 512, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 540 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 539, 540, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.5/self_attn/Concat_1_output_0", "outputIndexes": +[ 541 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 538, 541 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.5/self_attn/Reshape_1_output_0", "outputIndexes": +[ 542 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 542, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Mul_2_output_0", "outputIndexes": +[ 543 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 542 ] +, "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_3_output_0", "outputIndexes": +[ 544 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 544 ] +, "main_type": "NONE", "name": "Shape804", "outputIndexes": +[ 545 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 544 ] +, "main_type": "NONE", "name": "Rank806", "outputIndexes": +[ 546 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 546, 546 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp808", "outputIndexes": +[ 547 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 547 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze809", "outputIndexes": +[ 548 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 547, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp811", "outputIndexes": +[ 549 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 549 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze812", "outputIndexes": +[ 550 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 545, 548, 550, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice815", "outputIndexes": +[ 551 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 551 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze816", "outputIndexes": +[ 552 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 552 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp817", "outputIndexes": +[ 553 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 553, 552 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp818", "outputIndexes": +[ 554 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 544, 554, 547 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.5/self_attn/Gather_3_output_0", "outputIndexes": +[ 555 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 555, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Div_1_output_0", "outputIndexes": +[ 556 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 556, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 557 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 542, 557, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.5/self_attn/Slice_3_output_0", "outputIndexes": +[ 558 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 558 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.5/self_attn/Neg_1_output_0", "outputIndexes": +[ 559 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 556, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 560 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 542, 20, 560, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.5/self_attn/Slice_2_output_0", "outputIndexes": +[ 561 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 559, 561 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.5/self_attn/Concat_4_output_0", "outputIndexes": +[ 562 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 562, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Mul_3_output_0", "outputIndexes": +[ 563 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 543, 563 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Add_1_output_0", "outputIndexes": +[ 564 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3038 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 625574702, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.5/self_attn/v_proj/Linear", "outputIndexes": +[ 3047 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3047 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3048 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3048 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 565 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 504, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 566 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 512, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 567 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 566, 567, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.5/self_attn/Concat_2_output_0", "outputIndexes": +[ 568 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 565, 568 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.5/self_attn/Reshape_2_output_0", "outputIndexes": +[ 569 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 537, 564, 569, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.5/self_attn/FusedAttention", "outputIndexes": +[ 570 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 570 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3049 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3049 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.5/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3050 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3050 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 627934020, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.5/self_attn/o_proj/Linear", "outputIndexes": +[ 3051 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3051 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3052 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3052 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 571 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 491, 571 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/Add_output_0", "outputIndexes": +[ 572 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 572 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 637371226, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.5/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 573 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 573 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.5/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3053 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3053 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.5/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3054 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3054 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 637403994, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.5/mlp/gate_proj/Linear", "outputIndexes": +[ 3055 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3055 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3056 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3056 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.5/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 574 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 574 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.5/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 575 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3054 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 670434160, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.5/mlp/up_proj/Linear", "outputIndexes": +[ 3059 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3059 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3060 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3060 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.5/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 576 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 575, 576 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/mlp/Mul_output_0", "outputIndexes": +[ 577 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 577 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.5/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3061 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3061 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.5/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3062 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3062 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 703464326, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.5/mlp/down_proj/Linear", "outputIndexes": +[ 3063 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3063 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3064 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3064 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.5/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 578 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 572, 578 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/Add_1_output_0", "outputIndexes": +[ 579 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 579, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.6/Reshape_output_0", "outputIndexes": +[ 580 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 580 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 736494492, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.6/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 581 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 581 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3065 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3065 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.6/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3066 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3066 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 736527260, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.6/self_attn/q_proj/Linear", "outputIndexes": +[ 3067 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3067 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3068 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3068 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 582 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 581 ] +, "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_output_0", "outputIndexes": +[ 583 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 583 ] +, "main_type": "NONE", "name": "Shape864", "outputIndexes": +[ 584 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 583 ] +, "main_type": "NONE", "name": "Rank866", "outputIndexes": +[ 585 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 585, 585 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp868", "outputIndexes": +[ 586 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 586 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze869", "outputIndexes": +[ 587 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 586, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp871", "outputIndexes": +[ 588 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 588 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze872", "outputIndexes": +[ 589 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 584, 587, 589, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice875", "outputIndexes": +[ 590 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 590 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze876", "outputIndexes": +[ 591 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 591, 591 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp878", "outputIndexes": +[ 592 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 583, 592, 586 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.6/self_attn/Gather_output_0", "outputIndexes": +[ 593 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 593, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 594 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 586 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze886", "outputIndexes": +[ 595 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 588 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze889", "outputIndexes": +[ 596 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 584, 595, 596, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice892", "outputIndexes": +[ 597 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 597 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze893", "outputIndexes": +[ 598 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 598 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp894", "outputIndexes": +[ 599 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 599, 598 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp895", "outputIndexes": +[ 600 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 583, 600, 586 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.6/self_attn/Gather_1_output_0", "outputIndexes": +[ 601 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 601, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 602 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 594, 602, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.6/self_attn/Concat_output_0", "outputIndexes": +[ 603 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 582, 603 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.6/self_attn/Reshape_output_0", "outputIndexes": +[ 604 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 604, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Mul_output_0", "outputIndexes": +[ 605 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 604 ] +, "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_2_output_0", "outputIndexes": +[ 606 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 606 ] +, "main_type": "NONE", "name": "Shape902", "outputIndexes": +[ 607 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 606 ] +, "main_type": "NONE", "name": "Rank904", "outputIndexes": +[ 608 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 608, 608 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp906", "outputIndexes": +[ 609 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 609 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze907", "outputIndexes": +[ 610 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 609, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp909", "outputIndexes": +[ 611 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 611 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze910", "outputIndexes": +[ 612 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 607, 610, 612, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice913", "outputIndexes": +[ 613 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 613 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze914", "outputIndexes": +[ 614 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 614 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp915", "outputIndexes": +[ 615 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 615, 614 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp916", "outputIndexes": +[ 616 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 606, 616, 609 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.6/self_attn/Gather_2_output_0", "outputIndexes": +[ 617 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 617, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Div_output_0", "outputIndexes": +[ 618 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 618, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 619 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 604, 619, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.6/self_attn/Slice_1_output_0", "outputIndexes": +[ 620 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 620 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.6/self_attn/Neg_output_0", "outputIndexes": +[ 621 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 618, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 622 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 604, 20, 622, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.6/self_attn/Slice_output_0", "outputIndexes": +[ 623 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 621, 623 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.6/self_attn/Concat_3_output_0", "outputIndexes": +[ 624 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 624, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Mul_1_output_0", "outputIndexes": +[ 625 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 605, 625 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Add_output_0", "outputIndexes": +[ 626 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3066 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 745964466, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.6/self_attn/k_proj/Linear", "outputIndexes": +[ 3071 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3071 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3072 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3072 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 627 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 593, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 628 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 601, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 629 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 628, 629, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.6/self_attn/Concat_1_output_0", "outputIndexes": +[ 630 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 627, 630 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.6/self_attn/Reshape_1_output_0", "outputIndexes": +[ 631 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 631, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Mul_2_output_0", "outputIndexes": +[ 632 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 631 ] +, "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_3_output_0", "outputIndexes": +[ 633 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 633 ] +, "main_type": "NONE", "name": "Shape935", "outputIndexes": +[ 634 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 633 ] +, "main_type": "NONE", "name": "Rank937", "outputIndexes": +[ 635 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 635, 635 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp939", "outputIndexes": +[ 636 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 636 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze940", "outputIndexes": +[ 637 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 636, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp942", "outputIndexes": +[ 638 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 638 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze943", "outputIndexes": +[ 639 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 634, 637, 639, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice946", "outputIndexes": +[ 640 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 640 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze947", "outputIndexes": +[ 641 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 641 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp948", "outputIndexes": +[ 642 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 642, 641 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp949", "outputIndexes": +[ 643 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 633, 643, 636 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.6/self_attn/Gather_3_output_0", "outputIndexes": +[ 644 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 644, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Div_1_output_0", "outputIndexes": +[ 645 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 645, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 646 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 631, 646, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.6/self_attn/Slice_3_output_0", "outputIndexes": +[ 647 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 647 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.6/self_attn/Neg_1_output_0", "outputIndexes": +[ 648 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 645, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 649 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 631, 20, 649, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.6/self_attn/Slice_2_output_0", "outputIndexes": +[ 650 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 648, 650 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.6/self_attn/Concat_4_output_0", "outputIndexes": +[ 651 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 651, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Mul_3_output_0", "outputIndexes": +[ 652 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 632, 652 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Add_1_output_0", "outputIndexes": +[ 653 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3066 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 748323784, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.6/self_attn/v_proj/Linear", "outputIndexes": +[ 3075 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3075 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3076 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3076 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 654 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 593, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 655 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 601, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 656 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 655, 656, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.6/self_attn/Concat_2_output_0", "outputIndexes": +[ 657 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 654, 657 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.6/self_attn/Reshape_2_output_0", "outputIndexes": +[ 658 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 626, 653, 658, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.6/self_attn/FusedAttention", "outputIndexes": +[ 659 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 659 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3077 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3077 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.6/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3078 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3078 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 750683102, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.6/self_attn/o_proj/Linear", "outputIndexes": +[ 3079 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3079 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3080 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3080 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 660 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 580, 660 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/Add_output_0", "outputIndexes": +[ 661 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 661 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 760120308, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.6/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 662 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 662 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.6/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3081 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3081 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.6/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3082 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3082 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 760153076, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.6/mlp/gate_proj/Linear", "outputIndexes": +[ 3083 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3083 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3084 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3084 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.6/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 663 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 663 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.6/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 664 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3082 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 793183242, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.6/mlp/up_proj/Linear", "outputIndexes": +[ 3087 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3087 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3088 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3088 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.6/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 665 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 664, 665 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/mlp/Mul_output_0", "outputIndexes": +[ 666 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 666 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.6/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3089 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3089 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.6/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3090 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3090 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 826213408, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.6/mlp/down_proj/Linear", "outputIndexes": +[ 3091 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3091 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3092 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3092 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.6/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 667 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 661, 667 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/Add_1_output_0", "outputIndexes": +[ 668 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 668, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.7/Reshape_output_0", "outputIndexes": +[ 669 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 669 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 859243574, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.7/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 670 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 670 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3093 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3093 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.7/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3094 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3094 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 859276342, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.7/self_attn/q_proj/Linear", "outputIndexes": +[ 3095 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3095 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3096 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3096 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 671 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 670 ] +, "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_output_0", "outputIndexes": +[ 672 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 672 ] +, "main_type": "NONE", "name": "Shape995", "outputIndexes": +[ 673 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 672 ] +, "main_type": "NONE", "name": "Rank997", "outputIndexes": +[ 674 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 674, 674 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp999", "outputIndexes": +[ 675 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 675 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1000", "outputIndexes": +[ 676 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 675, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1002", "outputIndexes": +[ 677 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 677 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1003", "outputIndexes": +[ 678 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 673, 676, 678, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1006", "outputIndexes": +[ 679 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 679 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1007", "outputIndexes": +[ 680 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 680, 680 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1009", "outputIndexes": +[ 681 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 672, 681, 675 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.7/self_attn/Gather_output_0", "outputIndexes": +[ 682 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 682, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 683 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 675 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1017", "outputIndexes": +[ 684 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 677 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1020", "outputIndexes": +[ 685 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 673, 684, 685, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1023", "outputIndexes": +[ 686 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 686 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1024", "outputIndexes": +[ 687 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 687 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1025", "outputIndexes": +[ 688 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 688, 687 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1026", "outputIndexes": +[ 689 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 672, 689, 675 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.7/self_attn/Gather_1_output_0", "outputIndexes": +[ 690 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 690, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 691 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 683, 691, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.7/self_attn/Concat_output_0", "outputIndexes": +[ 692 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 671, 692 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.7/self_attn/Reshape_output_0", "outputIndexes": +[ 693 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 693, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Mul_output_0", "outputIndexes": +[ 694 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 693 ] +, "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_2_output_0", "outputIndexes": +[ 695 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 695 ] +, "main_type": "NONE", "name": "Shape1033", "outputIndexes": +[ 696 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 695 ] +, "main_type": "NONE", "name": "Rank1035", "outputIndexes": +[ 697 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 697, 697 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1037", "outputIndexes": +[ 698 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 698 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1038", "outputIndexes": +[ 699 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 698, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1040", "outputIndexes": +[ 700 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 700 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1041", "outputIndexes": +[ 701 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 696, 699, 701, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1044", "outputIndexes": +[ 702 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 702 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1045", "outputIndexes": +[ 703 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 703 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1046", "outputIndexes": +[ 704 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 704, 703 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1047", "outputIndexes": +[ 705 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 695, 705, 698 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.7/self_attn/Gather_2_output_0", "outputIndexes": +[ 706 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 706, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Div_output_0", "outputIndexes": +[ 707 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 707, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 708 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 693, 708, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.7/self_attn/Slice_1_output_0", "outputIndexes": +[ 709 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 709 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.7/self_attn/Neg_output_0", "outputIndexes": +[ 710 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 707, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 711 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 693, 20, 711, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.7/self_attn/Slice_output_0", "outputIndexes": +[ 712 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 710, 712 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.7/self_attn/Concat_3_output_0", "outputIndexes": +[ 713 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 713, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Mul_1_output_0", "outputIndexes": +[ 714 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 694, 714 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Add_output_0", "outputIndexes": +[ 715 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3094 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 868713548, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.7/self_attn/k_proj/Linear", "outputIndexes": +[ 3099 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3099 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3100 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3100 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 716 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 682, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 717 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 690, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 718 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 717, 718, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.7/self_attn/Concat_1_output_0", "outputIndexes": +[ 719 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 716, 719 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.7/self_attn/Reshape_1_output_0", "outputIndexes": +[ 720 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 720, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Mul_2_output_0", "outputIndexes": +[ 721 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 720 ] +, "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_3_output_0", "outputIndexes": +[ 722 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 722 ] +, "main_type": "NONE", "name": "Shape1066", "outputIndexes": +[ 723 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 722 ] +, "main_type": "NONE", "name": "Rank1068", "outputIndexes": +[ 724 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 724, 724 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1070", "outputIndexes": +[ 725 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 725 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1071", "outputIndexes": +[ 726 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 725, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1073", "outputIndexes": +[ 727 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 727 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1074", "outputIndexes": +[ 728 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 723, 726, 728, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1077", "outputIndexes": +[ 729 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 729 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1078", "outputIndexes": +[ 730 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 730 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1079", "outputIndexes": +[ 731 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 731, 730 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1080", "outputIndexes": +[ 732 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 722, 732, 725 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.7/self_attn/Gather_3_output_0", "outputIndexes": +[ 733 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 733, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Div_1_output_0", "outputIndexes": +[ 734 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 734, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 735 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 720, 735, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.7/self_attn/Slice_3_output_0", "outputIndexes": +[ 736 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 736 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.7/self_attn/Neg_1_output_0", "outputIndexes": +[ 737 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 734, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 738 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 720, 20, 738, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.7/self_attn/Slice_2_output_0", "outputIndexes": +[ 739 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 737, 739 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.7/self_attn/Concat_4_output_0", "outputIndexes": +[ 740 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 740, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Mul_3_output_0", "outputIndexes": +[ 741 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 721, 741 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Add_1_output_0", "outputIndexes": +[ 742 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3094 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 871072866, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.7/self_attn/v_proj/Linear", "outputIndexes": +[ 3103 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3103 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3104 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3104 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 743 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 682, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 744 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 690, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 745 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 744, 745, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.7/self_attn/Concat_2_output_0", "outputIndexes": +[ 746 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 743, 746 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.7/self_attn/Reshape_2_output_0", "outputIndexes": +[ 747 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 715, 742, 747, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.7/self_attn/FusedAttention", "outputIndexes": +[ 748 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 748 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3105 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3105 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.7/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3106 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3106 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 873432184, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.7/self_attn/o_proj/Linear", "outputIndexes": +[ 3107 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3107 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3108 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3108 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 749 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 669, 749 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/Add_output_0", "outputIndexes": +[ 750 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 750 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 882869390, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.7/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 751 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 751 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.7/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3109 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3109 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.7/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3110 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3110 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 882902158, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.7/mlp/gate_proj/Linear", "outputIndexes": +[ 3111 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3111 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3112 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3112 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.7/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 752 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 752 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.7/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 753 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3110 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 915932324, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.7/mlp/up_proj/Linear", "outputIndexes": +[ 3115 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3115 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3116 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3116 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.7/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 754 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 753, 754 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/mlp/Mul_output_0", "outputIndexes": +[ 755 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 755 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.7/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3117 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3117 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.7/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3118 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3118 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 948962490, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.7/mlp/down_proj/Linear", "outputIndexes": +[ 3119 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3119 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3120 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3120 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.7/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 756 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 750, 756 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/Add_1_output_0", "outputIndexes": +[ 757 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 757, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.8/Reshape_output_0", "outputIndexes": +[ 758 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 758 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 981992656, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.8/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 759 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 759 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3121 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3121 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.8/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3122 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3122 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 982025424, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.8/self_attn/q_proj/Linear", "outputIndexes": +[ 3123 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3123 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3124 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3124 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 760 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 759 ] +, "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_output_0", "outputIndexes": +[ 761 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 761 ] +, "main_type": "NONE", "name": "Shape1126", "outputIndexes": +[ 762 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 761 ] +, "main_type": "NONE", "name": "Rank1128", "outputIndexes": +[ 763 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 763, 763 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1130", "outputIndexes": +[ 764 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 764 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1131", "outputIndexes": +[ 765 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 764, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1133", "outputIndexes": +[ 766 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 766 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1134", "outputIndexes": +[ 767 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 762, 765, 767, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1137", "outputIndexes": +[ 768 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 768 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1138", "outputIndexes": +[ 769 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 769, 769 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1140", "outputIndexes": +[ 770 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 761, 770, 764 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.8/self_attn/Gather_output_0", "outputIndexes": +[ 771 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 771, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 772 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 764 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1148", "outputIndexes": +[ 773 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 766 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1151", "outputIndexes": +[ 774 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 762, 773, 774, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1154", "outputIndexes": +[ 775 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 775 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1155", "outputIndexes": +[ 776 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 776 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1156", "outputIndexes": +[ 777 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 777, 776 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1157", "outputIndexes": +[ 778 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 761, 778, 764 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.8/self_attn/Gather_1_output_0", "outputIndexes": +[ 779 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 779, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 780 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 772, 780, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.8/self_attn/Concat_output_0", "outputIndexes": +[ 781 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 760, 781 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.8/self_attn/Reshape_output_0", "outputIndexes": +[ 782 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 782, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Mul_output_0", "outputIndexes": +[ 783 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 782 ] +, "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_2_output_0", "outputIndexes": +[ 784 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 784 ] +, "main_type": "NONE", "name": "Shape1164", "outputIndexes": +[ 785 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 784 ] +, "main_type": "NONE", "name": "Rank1166", "outputIndexes": +[ 786 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 786, 786 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1168", "outputIndexes": +[ 787 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 787 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1169", "outputIndexes": +[ 788 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 787, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1171", "outputIndexes": +[ 789 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 789 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1172", "outputIndexes": +[ 790 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 785, 788, 790, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1175", "outputIndexes": +[ 791 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 791 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1176", "outputIndexes": +[ 792 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 792 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1177", "outputIndexes": +[ 793 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 793, 792 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1178", "outputIndexes": +[ 794 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 784, 794, 787 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.8/self_attn/Gather_2_output_0", "outputIndexes": +[ 795 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 795, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Div_output_0", "outputIndexes": +[ 796 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 796, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 797 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 782, 797, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.8/self_attn/Slice_1_output_0", "outputIndexes": +[ 798 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 798 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.8/self_attn/Neg_output_0", "outputIndexes": +[ 799 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 796, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 800 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 782, 20, 800, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.8/self_attn/Slice_output_0", "outputIndexes": +[ 801 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 799, 801 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.8/self_attn/Concat_3_output_0", "outputIndexes": +[ 802 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 802, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Mul_1_output_0", "outputIndexes": +[ 803 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 783, 803 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Add_output_0", "outputIndexes": +[ 804 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3122 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 991462630, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.8/self_attn/k_proj/Linear", "outputIndexes": +[ 3127 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3127 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3128 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3128 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 805 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 771, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 806 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 779, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 807 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 806, 807, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.8/self_attn/Concat_1_output_0", "outputIndexes": +[ 808 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 805, 808 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.8/self_attn/Reshape_1_output_0", "outputIndexes": +[ 809 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 809, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Mul_2_output_0", "outputIndexes": +[ 810 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 809 ] +, "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_3_output_0", "outputIndexes": +[ 811 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 811 ] +, "main_type": "NONE", "name": "Shape1197", "outputIndexes": +[ 812 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 811 ] +, "main_type": "NONE", "name": "Rank1199", "outputIndexes": +[ 813 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 813, 813 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1201", "outputIndexes": +[ 814 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 814 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1202", "outputIndexes": +[ 815 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 814, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1204", "outputIndexes": +[ 816 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 816 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1205", "outputIndexes": +[ 817 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 812, 815, 817, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1208", "outputIndexes": +[ 818 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 818 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1209", "outputIndexes": +[ 819 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 819 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1210", "outputIndexes": +[ 820 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 820, 819 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1211", "outputIndexes": +[ 821 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 811, 821, 814 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.8/self_attn/Gather_3_output_0", "outputIndexes": +[ 822 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 822, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Div_1_output_0", "outputIndexes": +[ 823 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 823, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 824 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 809, 824, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.8/self_attn/Slice_3_output_0", "outputIndexes": +[ 825 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 825 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.8/self_attn/Neg_1_output_0", "outputIndexes": +[ 826 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 823, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 827 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 809, 20, 827, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.8/self_attn/Slice_2_output_0", "outputIndexes": +[ 828 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 826, 828 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.8/self_attn/Concat_4_output_0", "outputIndexes": +[ 829 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 829, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Mul_3_output_0", "outputIndexes": +[ 830 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 810, 830 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Add_1_output_0", "outputIndexes": +[ 831 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3122 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 993821948, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.8/self_attn/v_proj/Linear", "outputIndexes": +[ 3131 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3131 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3132 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3132 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 832 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 771, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 833 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 779, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 834 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 833, 834, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.8/self_attn/Concat_2_output_0", "outputIndexes": +[ 835 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 832, 835 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.8/self_attn/Reshape_2_output_0", "outputIndexes": +[ 836 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 804, 831, 836, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.8/self_attn/FusedAttention", "outputIndexes": +[ 837 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 837 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3133 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3133 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.8/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3134 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3134 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 996181266, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.8/self_attn/o_proj/Linear", "outputIndexes": +[ 3135 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3135 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3136 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3136 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 838 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 758, 838 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/Add_output_0", "outputIndexes": +[ 839 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 839 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1005618472, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.8/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 840 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 840 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.8/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3137 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3137 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.8/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3138 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3138 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1005651240, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.8/mlp/gate_proj/Linear", "outputIndexes": +[ 3139 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3139 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3140 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3140 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.8/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 841 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 841 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.8/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 842 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3138 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1038681406, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.8/mlp/up_proj/Linear", "outputIndexes": +[ 3143 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3143 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3144 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3144 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.8/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 843 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 842, 843 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/mlp/Mul_output_0", "outputIndexes": +[ 844 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 844 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.8/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3145 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3145 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.8/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3146 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3146 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1071711572, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.8/mlp/down_proj/Linear", "outputIndexes": +[ 3147 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3147 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3148 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3148 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.8/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 845 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 839, 845 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/Add_1_output_0", "outputIndexes": +[ 846 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 846, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.9/Reshape_output_0", "outputIndexes": +[ 847 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 847 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1104741738, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.9/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 848 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 848 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3149 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3149 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.9/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3150 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3150 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1104774506, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.9/self_attn/q_proj/Linear", "outputIndexes": +[ 3151 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3151 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3152 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3152 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 849 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 848 ] +, "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_output_0", "outputIndexes": +[ 850 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 850 ] +, "main_type": "NONE", "name": "Shape1257", "outputIndexes": +[ 851 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 850 ] +, "main_type": "NONE", "name": "Rank1259", "outputIndexes": +[ 852 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 852, 852 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1261", "outputIndexes": +[ 853 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 853 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1262", "outputIndexes": +[ 854 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 853, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1264", "outputIndexes": +[ 855 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 855 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1265", "outputIndexes": +[ 856 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 851, 854, 856, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1268", "outputIndexes": +[ 857 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 857 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1269", "outputIndexes": +[ 858 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 858, 858 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1271", "outputIndexes": +[ 859 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 850, 859, 853 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.9/self_attn/Gather_output_0", "outputIndexes": +[ 860 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 860, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 861 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 853 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1279", "outputIndexes": +[ 862 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 855 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1282", "outputIndexes": +[ 863 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 851, 862, 863, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1285", "outputIndexes": +[ 864 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 864 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1286", "outputIndexes": +[ 865 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 865 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1287", "outputIndexes": +[ 866 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 866, 865 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1288", "outputIndexes": +[ 867 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 850, 867, 853 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.9/self_attn/Gather_1_output_0", "outputIndexes": +[ 868 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 868, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 869 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 861, 869, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.9/self_attn/Concat_output_0", "outputIndexes": +[ 870 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 849, 870 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.9/self_attn/Reshape_output_0", "outputIndexes": +[ 871 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 871, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Mul_output_0", "outputIndexes": +[ 872 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 871 ] +, "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_2_output_0", "outputIndexes": +[ 873 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 873 ] +, "main_type": "NONE", "name": "Shape1295", "outputIndexes": +[ 874 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 873 ] +, "main_type": "NONE", "name": "Rank1297", "outputIndexes": +[ 875 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 875, 875 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1299", "outputIndexes": +[ 876 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 876 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1300", "outputIndexes": +[ 877 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 876, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1302", "outputIndexes": +[ 878 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 878 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1303", "outputIndexes": +[ 879 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 874, 877, 879, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1306", "outputIndexes": +[ 880 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 880 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1307", "outputIndexes": +[ 881 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 881 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1308", "outputIndexes": +[ 882 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 882, 881 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1309", "outputIndexes": +[ 883 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 873, 883, 876 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.9/self_attn/Gather_2_output_0", "outputIndexes": +[ 884 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 884, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Div_output_0", "outputIndexes": +[ 885 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 885, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 886 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 871, 886, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.9/self_attn/Slice_1_output_0", "outputIndexes": +[ 887 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 887 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.9/self_attn/Neg_output_0", "outputIndexes": +[ 888 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 885, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 889 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 871, 20, 889, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.9/self_attn/Slice_output_0", "outputIndexes": +[ 890 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 888, 890 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.9/self_attn/Concat_3_output_0", "outputIndexes": +[ 891 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 891, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Mul_1_output_0", "outputIndexes": +[ 892 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 872, 892 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Add_output_0", "outputIndexes": +[ 893 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3150 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1114211712, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.9/self_attn/k_proj/Linear", "outputIndexes": +[ 3155 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3155 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3156 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3156 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 894 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 860, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 895 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 868, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 896 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 895, 896, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.9/self_attn/Concat_1_output_0", "outputIndexes": +[ 897 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 894, 897 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.9/self_attn/Reshape_1_output_0", "outputIndexes": +[ 898 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 898, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Mul_2_output_0", "outputIndexes": +[ 899 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 898 ] +, "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_3_output_0", "outputIndexes": +[ 900 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 900 ] +, "main_type": "NONE", "name": "Shape1328", "outputIndexes": +[ 901 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 900 ] +, "main_type": "NONE", "name": "Rank1330", "outputIndexes": +[ 902 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 902, 902 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1332", "outputIndexes": +[ 903 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 903 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1333", "outputIndexes": +[ 904 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 903, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1335", "outputIndexes": +[ 905 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 905 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1336", "outputIndexes": +[ 906 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 901, 904, 906, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1339", "outputIndexes": +[ 907 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 907 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1340", "outputIndexes": +[ 908 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 908 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1341", "outputIndexes": +[ 909 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 909, 908 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1342", "outputIndexes": +[ 910 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 900, 910, 903 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.9/self_attn/Gather_3_output_0", "outputIndexes": +[ 911 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 911, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Div_1_output_0", "outputIndexes": +[ 912 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 912, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 913 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 898, 913, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.9/self_attn/Slice_3_output_0", "outputIndexes": +[ 914 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 914 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.9/self_attn/Neg_1_output_0", "outputIndexes": +[ 915 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 912, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 916 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 898, 20, 916, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.9/self_attn/Slice_2_output_0", "outputIndexes": +[ 917 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 915, 917 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.9/self_attn/Concat_4_output_0", "outputIndexes": +[ 918 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 918, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Mul_3_output_0", "outputIndexes": +[ 919 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 899, 919 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Add_1_output_0", "outputIndexes": +[ 920 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3150 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1116571030, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.9/self_attn/v_proj/Linear", "outputIndexes": +[ 3159 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3159 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3160 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3160 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 921 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 860, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 922 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 868, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 923 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 922, 923, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.9/self_attn/Concat_2_output_0", "outputIndexes": +[ 924 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 921, 924 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.9/self_attn/Reshape_2_output_0", "outputIndexes": +[ 925 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 893, 920, 925, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.9/self_attn/FusedAttention", "outputIndexes": +[ 926 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 926 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3161 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3161 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.9/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3162 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3162 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1118930348, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.9/self_attn/o_proj/Linear", "outputIndexes": +[ 3163 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3163 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3164 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3164 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 927 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 847, 927 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/Add_output_0", "outputIndexes": +[ 928 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 928 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1128367554, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.9/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 929 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 929 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.9/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3165 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3165 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.9/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3166 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3166 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1128400322, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.9/mlp/gate_proj/Linear", "outputIndexes": +[ 3167 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3167 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3168 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3168 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.9/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 930 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 930 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.9/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 931 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3166 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1161430488, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.9/mlp/up_proj/Linear", "outputIndexes": +[ 3171 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3171 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3172 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3172 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.9/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 932 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 931, 932 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/mlp/Mul_output_0", "outputIndexes": +[ 933 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 933 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.9/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3173 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3173 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.9/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3174 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3174 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1194460654, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.9/mlp/down_proj/Linear", "outputIndexes": +[ 3175 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3175 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3176 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3176 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.9/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 934 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 928, 934 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/Add_1_output_0", "outputIndexes": +[ 935 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 935, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.10/Reshape_output_0", "outputIndexes": +[ 936 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 936 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1227490820, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.10/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 937 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 937 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3177 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3177 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.10/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3178 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3178 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1227523588, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.10/self_attn/q_proj/Linear", "outputIndexes": +[ 3179 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3179 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3180 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3180 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 938 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 937 ] +, "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_output_0", "outputIndexes": +[ 939 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 939 ] +, "main_type": "NONE", "name": "Shape1388", "outputIndexes": +[ 940 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 939 ] +, "main_type": "NONE", "name": "Rank1390", "outputIndexes": +[ 941 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 941, 941 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1392", "outputIndexes": +[ 942 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 942 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1393", "outputIndexes": +[ 943 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 942, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1395", "outputIndexes": +[ 944 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 944 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1396", "outputIndexes": +[ 945 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 940, 943, 945, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1399", "outputIndexes": +[ 946 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 946 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1400", "outputIndexes": +[ 947 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 947, 947 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1402", "outputIndexes": +[ 948 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 939, 948, 942 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.10/self_attn/Gather_output_0", "outputIndexes": +[ 949 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 949, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 950 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 942 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1410", "outputIndexes": +[ 951 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 944 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1413", "outputIndexes": +[ 952 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 940, 951, 952, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1416", "outputIndexes": +[ 953 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 953 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1417", "outputIndexes": +[ 954 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 954 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1418", "outputIndexes": +[ 955 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 955, 954 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1419", "outputIndexes": +[ 956 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 939, 956, 942 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.10/self_attn/Gather_1_output_0", "outputIndexes": +[ 957 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 957, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 958 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 950, 958, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.10/self_attn/Concat_output_0", "outputIndexes": +[ 959 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 938, 959 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.10/self_attn/Reshape_output_0", "outputIndexes": +[ 960 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 960, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Mul_output_0", "outputIndexes": +[ 961 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 960 ] +, "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_2_output_0", "outputIndexes": +[ 962 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 962 ] +, "main_type": "NONE", "name": "Shape1426", "outputIndexes": +[ 963 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 962 ] +, "main_type": "NONE", "name": "Rank1428", "outputIndexes": +[ 964 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 964, 964 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1430", "outputIndexes": +[ 965 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 965 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1431", "outputIndexes": +[ 966 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 965, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1433", "outputIndexes": +[ 967 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 967 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1434", "outputIndexes": +[ 968 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 963, 966, 968, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1437", "outputIndexes": +[ 969 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 969 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1438", "outputIndexes": +[ 970 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 970 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1439", "outputIndexes": +[ 971 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 971, 970 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1440", "outputIndexes": +[ 972 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 962, 972, 965 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.10/self_attn/Gather_2_output_0", "outputIndexes": +[ 973 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 973, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Div_output_0", "outputIndexes": +[ 974 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 974, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 975 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 960, 975, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.10/self_attn/Slice_1_output_0", "outputIndexes": +[ 976 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 976 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.10/self_attn/Neg_output_0", "outputIndexes": +[ 977 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 974, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 978 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 960, 20, 978, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.10/self_attn/Slice_output_0", "outputIndexes": +[ 979 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 977, 979 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.10/self_attn/Concat_3_output_0", "outputIndexes": +[ 980 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 980, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Mul_1_output_0", "outputIndexes": +[ 981 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 961, 981 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Add_output_0", "outputIndexes": +[ 982 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3178 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1236960794, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.10/self_attn/k_proj/Linear", "outputIndexes": +[ 3183 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3183 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3184 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3184 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 983 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 949, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 984 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 957, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 985 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 984, 985, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.10/self_attn/Concat_1_output_0", "outputIndexes": +[ 986 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 983, 986 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.10/self_attn/Reshape_1_output_0", "outputIndexes": +[ 987 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 987, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Mul_2_output_0", "outputIndexes": +[ 988 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 987 ] +, "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_3_output_0", "outputIndexes": +[ 989 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 989 ] +, "main_type": "NONE", "name": "Shape1459", "outputIndexes": +[ 990 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 989 ] +, "main_type": "NONE", "name": "Rank1461", "outputIndexes": +[ 991 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 991, 991 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1463", "outputIndexes": +[ 992 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 992 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1464", "outputIndexes": +[ 993 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 992, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1466", "outputIndexes": +[ 994 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 994 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1467", "outputIndexes": +[ 995 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 990, 993, 995, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1470", "outputIndexes": +[ 996 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 996 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1471", "outputIndexes": +[ 997 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 997 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1472", "outputIndexes": +[ 998 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 998, 997 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1473", "outputIndexes": +[ 999 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 989, 999, 992 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.10/self_attn/Gather_3_output_0", "outputIndexes": +[ 1000 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1000, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Div_1_output_0", "outputIndexes": +[ 1001 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1001, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1002 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 987, 1002, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.10/self_attn/Slice_3_output_0", "outputIndexes": +[ 1003 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1003 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.10/self_attn/Neg_1_output_0", "outputIndexes": +[ 1004 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1001, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1005 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 987, 20, 1005, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.10/self_attn/Slice_2_output_0", "outputIndexes": +[ 1006 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1004, 1006 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.10/self_attn/Concat_4_output_0", "outputIndexes": +[ 1007 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1007, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Mul_3_output_0", "outputIndexes": +[ 1008 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 988, 1008 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Add_1_output_0", "outputIndexes": +[ 1009 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3178 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1239320112, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.10/self_attn/v_proj/Linear", "outputIndexes": +[ 3187 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3187 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3188 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3188 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1010 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 949, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1011 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 957, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1012 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1011, 1012, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.10/self_attn/Concat_2_output_0", "outputIndexes": +[ 1013 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1010, 1013 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.10/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1014 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 982, 1009, 1014, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.10/self_attn/FusedAttention", "outputIndexes": +[ 1015 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1015 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3189 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3189 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.10/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3190 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3190 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1241679430, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.10/self_attn/o_proj/Linear", "outputIndexes": +[ 3191 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3191 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3192 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3192 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1016 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 936, 1016 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/Add_output_0", "outputIndexes": +[ 1017 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1017 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1251116636, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.10/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1018 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1018 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.10/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3193 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3193 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.10/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3194 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3194 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1251149404, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.10/mlp/gate_proj/Linear", "outputIndexes": +[ 3195 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3195 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3196 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3196 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.10/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1019 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1019 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.10/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1020 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3194 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1284179570, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.10/mlp/up_proj/Linear", "outputIndexes": +[ 3199 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3199 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3200 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3200 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.10/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1021 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1020, 1021 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/mlp/Mul_output_0", "outputIndexes": +[ 1022 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1022 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.10/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3201 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3201 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.10/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3202 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3202 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1317209736, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.10/mlp/down_proj/Linear", "outputIndexes": +[ 3203 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3203 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3204 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3204 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.10/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1023 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1017, 1023 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/Add_1_output_0", "outputIndexes": +[ 1024 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1024, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.11/Reshape_output_0", "outputIndexes": +[ 1025 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1025 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1350239902, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.11/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1026 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1026 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3205 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3205 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.11/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3206 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3206 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1350272670, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.11/self_attn/q_proj/Linear", "outputIndexes": +[ 3207 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3207 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3208 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3208 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1027 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1026 ] +, "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_output_0", "outputIndexes": +[ 1028 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1028 ] +, "main_type": "NONE", "name": "Shape1519", "outputIndexes": +[ 1029 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1028 ] +, "main_type": "NONE", "name": "Rank1521", "outputIndexes": +[ 1030 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1030, 1030 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1523", "outputIndexes": +[ 1031 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1031 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1524", "outputIndexes": +[ 1032 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1031, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1526", "outputIndexes": +[ 1033 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1033 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1527", "outputIndexes": +[ 1034 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1029, 1032, 1034, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1530", "outputIndexes": +[ 1035 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1035 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1531", "outputIndexes": +[ 1036 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1036, 1036 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1533", "outputIndexes": +[ 1037 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1028, 1037, 1031 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.11/self_attn/Gather_output_0", "outputIndexes": +[ 1038 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1038, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1039 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1031 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1541", "outputIndexes": +[ 1040 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1033 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1544", "outputIndexes": +[ 1041 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1029, 1040, 1041, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1547", "outputIndexes": +[ 1042 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1042 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1548", "outputIndexes": +[ 1043 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1043 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1549", "outputIndexes": +[ 1044 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1044, 1043 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1550", "outputIndexes": +[ 1045 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1028, 1045, 1031 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.11/self_attn/Gather_1_output_0", "outputIndexes": +[ 1046 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1046, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1047 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1039, 1047, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.11/self_attn/Concat_output_0", "outputIndexes": +[ 1048 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1027, 1048 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.11/self_attn/Reshape_output_0", "outputIndexes": +[ 1049 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1049, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Mul_output_0", "outputIndexes": +[ 1050 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1049 ] +, "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_2_output_0", "outputIndexes": +[ 1051 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1051 ] +, "main_type": "NONE", "name": "Shape1557", "outputIndexes": +[ 1052 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1051 ] +, "main_type": "NONE", "name": "Rank1559", "outputIndexes": +[ 1053 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1053, 1053 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1561", "outputIndexes": +[ 1054 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1054 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1562", "outputIndexes": +[ 1055 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1054, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1564", "outputIndexes": +[ 1056 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1056 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1565", "outputIndexes": +[ 1057 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1052, 1055, 1057, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1568", "outputIndexes": +[ 1058 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1058 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1569", "outputIndexes": +[ 1059 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1059 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1570", "outputIndexes": +[ 1060 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1060, 1059 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1571", "outputIndexes": +[ 1061 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1051, 1061, 1054 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.11/self_attn/Gather_2_output_0", "outputIndexes": +[ 1062 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1062, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Div_output_0", "outputIndexes": +[ 1063 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1063, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1064 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1049, 1064, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.11/self_attn/Slice_1_output_0", "outputIndexes": +[ 1065 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1065 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.11/self_attn/Neg_output_0", "outputIndexes": +[ 1066 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1063, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1067 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1049, 20, 1067, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.11/self_attn/Slice_output_0", "outputIndexes": +[ 1068 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1066, 1068 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.11/self_attn/Concat_3_output_0", "outputIndexes": +[ 1069 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1069, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Mul_1_output_0", "outputIndexes": +[ 1070 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1050, 1070 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Add_output_0", "outputIndexes": +[ 1071 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3206 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1359709876, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.11/self_attn/k_proj/Linear", "outputIndexes": +[ 3211 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3211 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3212 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3212 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1072 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1038, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1073 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1046, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1074 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1073, 1074, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.11/self_attn/Concat_1_output_0", "outputIndexes": +[ 1075 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1072, 1075 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.11/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1076 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1076, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Mul_2_output_0", "outputIndexes": +[ 1077 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1076 ] +, "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_3_output_0", "outputIndexes": +[ 1078 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1078 ] +, "main_type": "NONE", "name": "Shape1590", "outputIndexes": +[ 1079 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1078 ] +, "main_type": "NONE", "name": "Rank1592", "outputIndexes": +[ 1080 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1080, 1080 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1594", "outputIndexes": +[ 1081 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1081 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1595", "outputIndexes": +[ 1082 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1081, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1597", "outputIndexes": +[ 1083 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1083 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1598", "outputIndexes": +[ 1084 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1079, 1082, 1084, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1601", "outputIndexes": +[ 1085 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1085 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1602", "outputIndexes": +[ 1086 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1086 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1603", "outputIndexes": +[ 1087 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1087, 1086 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1604", "outputIndexes": +[ 1088 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1078, 1088, 1081 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.11/self_attn/Gather_3_output_0", "outputIndexes": +[ 1089 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1089, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Div_1_output_0", "outputIndexes": +[ 1090 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1090, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1091 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1076, 1091, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.11/self_attn/Slice_3_output_0", "outputIndexes": +[ 1092 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1092 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.11/self_attn/Neg_1_output_0", "outputIndexes": +[ 1093 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1090, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1094 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1076, 20, 1094, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.11/self_attn/Slice_2_output_0", "outputIndexes": +[ 1095 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1093, 1095 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.11/self_attn/Concat_4_output_0", "outputIndexes": +[ 1096 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1096, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Mul_3_output_0", "outputIndexes": +[ 1097 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1077, 1097 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Add_1_output_0", "outputIndexes": +[ 1098 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3206 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1362069194, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.11/self_attn/v_proj/Linear", "outputIndexes": +[ 3215 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3215 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3216 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3216 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1099 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1038, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1100 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1046, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1101 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1100, 1101, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.11/self_attn/Concat_2_output_0", "outputIndexes": +[ 1102 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1099, 1102 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.11/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1103 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1071, 1098, 1103, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.11/self_attn/FusedAttention", "outputIndexes": +[ 1104 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1104 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3217 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3217 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.11/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3218 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3218 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1364428512, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.11/self_attn/o_proj/Linear", "outputIndexes": +[ 3219 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3219 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3220 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3220 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1105 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1025, 1105 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/Add_output_0", "outputIndexes": +[ 1106 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1106 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1373865718, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.11/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1107 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1107 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.11/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3221 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3221 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.11/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3222 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3222 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1373898486, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.11/mlp/gate_proj/Linear", "outputIndexes": +[ 3223 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3223 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3224 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3224 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.11/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1108 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1108 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.11/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1109 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3222 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1406928652, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.11/mlp/up_proj/Linear", "outputIndexes": +[ 3227 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3227 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3228 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3228 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.11/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1110 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1109, 1110 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/mlp/Mul_output_0", "outputIndexes": +[ 1111 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1111 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.11/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3229 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3229 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.11/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3230 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3230 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1439958818, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.11/mlp/down_proj/Linear", "outputIndexes": +[ 3231 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3231 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3232 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3232 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.11/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1112 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1106, 1112 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/Add_1_output_0", "outputIndexes": +[ 1113 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1113, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.12/Reshape_output_0", "outputIndexes": +[ 1114 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1114 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1472988984, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.12/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1115 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1115 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3233 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3233 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.12/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3234 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3234 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1473021752, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.12/self_attn/q_proj/Linear", "outputIndexes": +[ 3235 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3235 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3236 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3236 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1116 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1115 ] +, "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_output_0", "outputIndexes": +[ 1117 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1117 ] +, "main_type": "NONE", "name": "Shape1650", "outputIndexes": +[ 1118 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1117 ] +, "main_type": "NONE", "name": "Rank1652", "outputIndexes": +[ 1119 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1119, 1119 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1654", "outputIndexes": +[ 1120 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1120 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1655", "outputIndexes": +[ 1121 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1120, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1657", "outputIndexes": +[ 1122 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1122 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1658", "outputIndexes": +[ 1123 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1118, 1121, 1123, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1661", "outputIndexes": +[ 1124 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1124 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1662", "outputIndexes": +[ 1125 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1125, 1125 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1664", "outputIndexes": +[ 1126 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1117, 1126, 1120 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.12/self_attn/Gather_output_0", "outputIndexes": +[ 1127 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1127, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1128 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1120 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1672", "outputIndexes": +[ 1129 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1122 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1675", "outputIndexes": +[ 1130 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1118, 1129, 1130, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1678", "outputIndexes": +[ 1131 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1131 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1679", "outputIndexes": +[ 1132 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1132 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1680", "outputIndexes": +[ 1133 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1133, 1132 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1681", "outputIndexes": +[ 1134 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1117, 1134, 1120 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.12/self_attn/Gather_1_output_0", "outputIndexes": +[ 1135 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1135, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1136 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1128, 1136, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.12/self_attn/Concat_output_0", "outputIndexes": +[ 1137 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1116, 1137 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.12/self_attn/Reshape_output_0", "outputIndexes": +[ 1138 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1138, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Mul_output_0", "outputIndexes": +[ 1139 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1138 ] +, "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_2_output_0", "outputIndexes": +[ 1140 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1140 ] +, "main_type": "NONE", "name": "Shape1688", "outputIndexes": +[ 1141 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1140 ] +, "main_type": "NONE", "name": "Rank1690", "outputIndexes": +[ 1142 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1142, 1142 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1692", "outputIndexes": +[ 1143 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1143 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1693", "outputIndexes": +[ 1144 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1143, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1695", "outputIndexes": +[ 1145 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1145 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1696", "outputIndexes": +[ 1146 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1141, 1144, 1146, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1699", "outputIndexes": +[ 1147 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1147 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1700", "outputIndexes": +[ 1148 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1148 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1701", "outputIndexes": +[ 1149 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1149, 1148 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1702", "outputIndexes": +[ 1150 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1140, 1150, 1143 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.12/self_attn/Gather_2_output_0", "outputIndexes": +[ 1151 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1151, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Div_output_0", "outputIndexes": +[ 1152 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1152, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1153 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1138, 1153, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.12/self_attn/Slice_1_output_0", "outputIndexes": +[ 1154 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1154 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.12/self_attn/Neg_output_0", "outputIndexes": +[ 1155 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1152, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1156 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1138, 20, 1156, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.12/self_attn/Slice_output_0", "outputIndexes": +[ 1157 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1155, 1157 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.12/self_attn/Concat_3_output_0", "outputIndexes": +[ 1158 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1158, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Mul_1_output_0", "outputIndexes": +[ 1159 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1139, 1159 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Add_output_0", "outputIndexes": +[ 1160 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3234 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1482458958, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.12/self_attn/k_proj/Linear", "outputIndexes": +[ 3239 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3239 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3240 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3240 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1161 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1127, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1162 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1135, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1163 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1162, 1163, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.12/self_attn/Concat_1_output_0", "outputIndexes": +[ 1164 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1161, 1164 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.12/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1165 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1165, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Mul_2_output_0", "outputIndexes": +[ 1166 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1165 ] +, "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_3_output_0", "outputIndexes": +[ 1167 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1167 ] +, "main_type": "NONE", "name": "Shape1721", "outputIndexes": +[ 1168 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1167 ] +, "main_type": "NONE", "name": "Rank1723", "outputIndexes": +[ 1169 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1169, 1169 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1725", "outputIndexes": +[ 1170 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1170 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1726", "outputIndexes": +[ 1171 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1170, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1728", "outputIndexes": +[ 1172 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1172 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1729", "outputIndexes": +[ 1173 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1168, 1171, 1173, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1732", "outputIndexes": +[ 1174 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1174 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1733", "outputIndexes": +[ 1175 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1175 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1734", "outputIndexes": +[ 1176 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1176, 1175 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1735", "outputIndexes": +[ 1177 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1167, 1177, 1170 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.12/self_attn/Gather_3_output_0", "outputIndexes": +[ 1178 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1178, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Div_1_output_0", "outputIndexes": +[ 1179 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1179, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1180 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1165, 1180, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.12/self_attn/Slice_3_output_0", "outputIndexes": +[ 1181 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1181 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.12/self_attn/Neg_1_output_0", "outputIndexes": +[ 1182 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1179, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1183 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1165, 20, 1183, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.12/self_attn/Slice_2_output_0", "outputIndexes": +[ 1184 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1182, 1184 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.12/self_attn/Concat_4_output_0", "outputIndexes": +[ 1185 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1185, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Mul_3_output_0", "outputIndexes": +[ 1186 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1166, 1186 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Add_1_output_0", "outputIndexes": +[ 1187 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3234 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1484818276, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.12/self_attn/v_proj/Linear", "outputIndexes": +[ 3243 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3243 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3244 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3244 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1188 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1127, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1189 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1135, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1190 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1189, 1190, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.12/self_attn/Concat_2_output_0", "outputIndexes": +[ 1191 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1188, 1191 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.12/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1192 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1160, 1187, 1192, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.12/self_attn/FusedAttention", "outputIndexes": +[ 1193 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1193 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3245 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3245 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.12/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3246 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3246 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1487177594, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.12/self_attn/o_proj/Linear", "outputIndexes": +[ 3247 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3247 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3248 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3248 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1194 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1114, 1194 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/Add_output_0", "outputIndexes": +[ 1195 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1195 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1496614800, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.12/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1196 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1196 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.12/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3249 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3249 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.12/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3250 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3250 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1496647568, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.12/mlp/gate_proj/Linear", "outputIndexes": +[ 3251 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3251 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3252 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3252 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.12/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1197 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1197 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.12/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1198 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3250 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1529677734, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.12/mlp/up_proj/Linear", "outputIndexes": +[ 3255 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3255 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3256 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3256 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.12/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1199 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1198, 1199 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/mlp/Mul_output_0", "outputIndexes": +[ 1200 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1200 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.12/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3257 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3257 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.12/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3258 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3258 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1562707900, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.12/mlp/down_proj/Linear", "outputIndexes": +[ 3259 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3259 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3260 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3260 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.12/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1201 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1195, 1201 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/Add_1_output_0", "outputIndexes": +[ 1202 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1202, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.13/Reshape_output_0", "outputIndexes": +[ 1203 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1203 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1595738066, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.13/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1204 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1204 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3261 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3261 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.13/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3262 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3262 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1595770834, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.13/self_attn/q_proj/Linear", "outputIndexes": +[ 3263 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3263 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3264 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3264 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1205 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1204 ] +, "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_output_0", "outputIndexes": +[ 1206 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1206 ] +, "main_type": "NONE", "name": "Shape1781", "outputIndexes": +[ 1207 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1206 ] +, "main_type": "NONE", "name": "Rank1783", "outputIndexes": +[ 1208 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1208, 1208 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1785", "outputIndexes": +[ 1209 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1209 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1786", "outputIndexes": +[ 1210 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1209, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1788", "outputIndexes": +[ 1211 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1211 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1789", "outputIndexes": +[ 1212 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1207, 1210, 1212, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1792", "outputIndexes": +[ 1213 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1213 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1793", "outputIndexes": +[ 1214 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1214, 1214 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1795", "outputIndexes": +[ 1215 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1206, 1215, 1209 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.13/self_attn/Gather_output_0", "outputIndexes": +[ 1216 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1216, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1217 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1209 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1803", "outputIndexes": +[ 1218 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1211 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1806", "outputIndexes": +[ 1219 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1207, 1218, 1219, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1809", "outputIndexes": +[ 1220 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1220 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1810", "outputIndexes": +[ 1221 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1221 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1811", "outputIndexes": +[ 1222 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1222, 1221 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1812", "outputIndexes": +[ 1223 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1206, 1223, 1209 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.13/self_attn/Gather_1_output_0", "outputIndexes": +[ 1224 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1224, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1225 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1217, 1225, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.13/self_attn/Concat_output_0", "outputIndexes": +[ 1226 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1205, 1226 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.13/self_attn/Reshape_output_0", "outputIndexes": +[ 1227 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1227, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Mul_output_0", "outputIndexes": +[ 1228 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1227 ] +, "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_2_output_0", "outputIndexes": +[ 1229 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1229 ] +, "main_type": "NONE", "name": "Shape1819", "outputIndexes": +[ 1230 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1229 ] +, "main_type": "NONE", "name": "Rank1821", "outputIndexes": +[ 1231 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1231, 1231 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1823", "outputIndexes": +[ 1232 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1232 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1824", "outputIndexes": +[ 1233 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1232, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1826", "outputIndexes": +[ 1234 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1234 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1827", "outputIndexes": +[ 1235 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1230, 1233, 1235, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1830", "outputIndexes": +[ 1236 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1236 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1831", "outputIndexes": +[ 1237 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1237 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1832", "outputIndexes": +[ 1238 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1238, 1237 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1833", "outputIndexes": +[ 1239 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1229, 1239, 1232 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.13/self_attn/Gather_2_output_0", "outputIndexes": +[ 1240 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1240, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Div_output_0", "outputIndexes": +[ 1241 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1241, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1242 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1227, 1242, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.13/self_attn/Slice_1_output_0", "outputIndexes": +[ 1243 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1243 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.13/self_attn/Neg_output_0", "outputIndexes": +[ 1244 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1241, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1245 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1227, 20, 1245, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.13/self_attn/Slice_output_0", "outputIndexes": +[ 1246 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1244, 1246 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.13/self_attn/Concat_3_output_0", "outputIndexes": +[ 1247 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1247, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Mul_1_output_0", "outputIndexes": +[ 1248 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1228, 1248 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Add_output_0", "outputIndexes": +[ 1249 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3262 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1605208040, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.13/self_attn/k_proj/Linear", "outputIndexes": +[ 3267 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3267 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3268 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3268 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1250 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1216, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1251 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1224, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1252 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1251, 1252, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.13/self_attn/Concat_1_output_0", "outputIndexes": +[ 1253 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1250, 1253 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.13/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1254 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1254, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Mul_2_output_0", "outputIndexes": +[ 1255 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1254 ] +, "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_3_output_0", "outputIndexes": +[ 1256 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1256 ] +, "main_type": "NONE", "name": "Shape1852", "outputIndexes": +[ 1257 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1256 ] +, "main_type": "NONE", "name": "Rank1854", "outputIndexes": +[ 1258 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1258, 1258 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1856", "outputIndexes": +[ 1259 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1259 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1857", "outputIndexes": +[ 1260 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1259, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1859", "outputIndexes": +[ 1261 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1261 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1860", "outputIndexes": +[ 1262 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1257, 1260, 1262, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1863", "outputIndexes": +[ 1263 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1263 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1864", "outputIndexes": +[ 1264 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1264 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1865", "outputIndexes": +[ 1265 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1265, 1264 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1866", "outputIndexes": +[ 1266 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1256, 1266, 1259 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.13/self_attn/Gather_3_output_0", "outputIndexes": +[ 1267 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1267, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Div_1_output_0", "outputIndexes": +[ 1268 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1268, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1269 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1254, 1269, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.13/self_attn/Slice_3_output_0", "outputIndexes": +[ 1270 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1270 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.13/self_attn/Neg_1_output_0", "outputIndexes": +[ 1271 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1268, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1272 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1254, 20, 1272, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.13/self_attn/Slice_2_output_0", "outputIndexes": +[ 1273 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1271, 1273 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.13/self_attn/Concat_4_output_0", "outputIndexes": +[ 1274 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1274, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Mul_3_output_0", "outputIndexes": +[ 1275 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1255, 1275 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Add_1_output_0", "outputIndexes": +[ 1276 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3262 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1607567358, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.13/self_attn/v_proj/Linear", "outputIndexes": +[ 3271 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3271 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3272 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3272 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1277 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1216, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1278 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1224, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1279 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1278, 1279, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.13/self_attn/Concat_2_output_0", "outputIndexes": +[ 1280 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1277, 1280 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.13/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1281 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1249, 1276, 1281, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.13/self_attn/FusedAttention", "outputIndexes": +[ 1282 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1282 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3273 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3273 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.13/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3274 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3274 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1609926676, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.13/self_attn/o_proj/Linear", "outputIndexes": +[ 3275 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3275 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3276 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3276 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1283 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1203, 1283 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/Add_output_0", "outputIndexes": +[ 1284 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1284 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1619363882, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.13/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1285 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1285 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.13/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3277 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3277 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.13/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3278 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3278 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1619396650, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.13/mlp/gate_proj/Linear", "outputIndexes": +[ 3279 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3279 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3280 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3280 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.13/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1286 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1286 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.13/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1287 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3278 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1652426816, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.13/mlp/up_proj/Linear", "outputIndexes": +[ 3283 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3283 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3284 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3284 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.13/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1288 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1287, 1288 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/mlp/Mul_output_0", "outputIndexes": +[ 1289 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1289 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.13/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3285 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3285 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.13/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3286 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3286 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1685456982, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.13/mlp/down_proj/Linear", "outputIndexes": +[ 3287 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3287 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3288 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3288 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.13/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1290 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1284, 1290 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/Add_1_output_0", "outputIndexes": +[ 1291 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1291, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.14/Reshape_output_0", "outputIndexes": +[ 1292 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1292 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1718487148, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.14/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1293 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1293 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3289 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3289 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.14/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3290 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3290 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1718519916, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.14/self_attn/q_proj/Linear", "outputIndexes": +[ 3291 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3291 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3292 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3292 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1294 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1293 ] +, "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_output_0", "outputIndexes": +[ 1295 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1295 ] +, "main_type": "NONE", "name": "Shape1912", "outputIndexes": +[ 1296 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1295 ] +, "main_type": "NONE", "name": "Rank1914", "outputIndexes": +[ 1297 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1297, 1297 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1916", "outputIndexes": +[ 1298 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1298 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1917", "outputIndexes": +[ 1299 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1298, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1919", "outputIndexes": +[ 1300 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1300 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1920", "outputIndexes": +[ 1301 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1296, 1299, 1301, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1923", "outputIndexes": +[ 1302 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1302 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1924", "outputIndexes": +[ 1303 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1303, 1303 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1926", "outputIndexes": +[ 1304 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1295, 1304, 1298 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.14/self_attn/Gather_output_0", "outputIndexes": +[ 1305 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1305, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1306 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1298 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1934", "outputIndexes": +[ 1307 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1300 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1937", "outputIndexes": +[ 1308 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1296, 1307, 1308, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1940", "outputIndexes": +[ 1309 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1309 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1941", "outputIndexes": +[ 1310 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1310 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1942", "outputIndexes": +[ 1311 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1311, 1310 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1943", "outputIndexes": +[ 1312 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1295, 1312, 1298 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.14/self_attn/Gather_1_output_0", "outputIndexes": +[ 1313 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1313, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1314 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1306, 1314, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.14/self_attn/Concat_output_0", "outputIndexes": +[ 1315 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1294, 1315 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.14/self_attn/Reshape_output_0", "outputIndexes": +[ 1316 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1316, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Mul_output_0", "outputIndexes": +[ 1317 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1316 ] +, "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_2_output_0", "outputIndexes": +[ 1318 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1318 ] +, "main_type": "NONE", "name": "Shape1950", "outputIndexes": +[ 1319 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1318 ] +, "main_type": "NONE", "name": "Rank1952", "outputIndexes": +[ 1320 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1320, 1320 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1954", "outputIndexes": +[ 1321 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1321 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1955", "outputIndexes": +[ 1322 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1321, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1957", "outputIndexes": +[ 1323 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1323 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1958", "outputIndexes": +[ 1324 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1319, 1322, 1324, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1961", "outputIndexes": +[ 1325 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1325 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1962", "outputIndexes": +[ 1326 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1326 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1963", "outputIndexes": +[ 1327 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1327, 1326 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1964", "outputIndexes": +[ 1328 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1318, 1328, 1321 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.14/self_attn/Gather_2_output_0", "outputIndexes": +[ 1329 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1329, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Div_output_0", "outputIndexes": +[ 1330 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1330, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1331 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1316, 1331, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.14/self_attn/Slice_1_output_0", "outputIndexes": +[ 1332 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1332 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.14/self_attn/Neg_output_0", "outputIndexes": +[ 1333 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1330, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1334 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1316, 20, 1334, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.14/self_attn/Slice_output_0", "outputIndexes": +[ 1335 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1333, 1335 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.14/self_attn/Concat_3_output_0", "outputIndexes": +[ 1336 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1336, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Mul_1_output_0", "outputIndexes": +[ 1337 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1317, 1337 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Add_output_0", "outputIndexes": +[ 1338 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3290 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1727957122, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.14/self_attn/k_proj/Linear", "outputIndexes": +[ 3295 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3295 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3296 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3296 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1339 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1305, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1340 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1313, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1341 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1340, 1341, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.14/self_attn/Concat_1_output_0", "outputIndexes": +[ 1342 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1339, 1342 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.14/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1343 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1343, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Mul_2_output_0", "outputIndexes": +[ 1344 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1343 ] +, "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_3_output_0", "outputIndexes": +[ 1345 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1345 ] +, "main_type": "NONE", "name": "Shape1983", "outputIndexes": +[ 1346 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1345 ] +, "main_type": "NONE", "name": "Rank1985", "outputIndexes": +[ 1347 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1347, 1347 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1987", "outputIndexes": +[ 1348 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1348 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1988", "outputIndexes": +[ 1349 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1348, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1990", "outputIndexes": +[ 1350 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1350 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1991", "outputIndexes": +[ 1351 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1346, 1349, 1351, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1994", "outputIndexes": +[ 1352 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1352 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1995", "outputIndexes": +[ 1353 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1353 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1996", "outputIndexes": +[ 1354 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1354, 1353 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1997", "outputIndexes": +[ 1355 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1345, 1355, 1348 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.14/self_attn/Gather_3_output_0", "outputIndexes": +[ 1356 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1356, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Div_1_output_0", "outputIndexes": +[ 1357 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1357, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1358 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1343, 1358, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.14/self_attn/Slice_3_output_0", "outputIndexes": +[ 1359 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1359 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.14/self_attn/Neg_1_output_0", "outputIndexes": +[ 1360 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1357, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1361 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1343, 20, 1361, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.14/self_attn/Slice_2_output_0", "outputIndexes": +[ 1362 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1360, 1362 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.14/self_attn/Concat_4_output_0", "outputIndexes": +[ 1363 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1363, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Mul_3_output_0", "outputIndexes": +[ 1364 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1344, 1364 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Add_1_output_0", "outputIndexes": +[ 1365 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3290 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1730316440, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.14/self_attn/v_proj/Linear", "outputIndexes": +[ 3299 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3299 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3300 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3300 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1366 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1305, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1367 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1313, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1368 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1367, 1368, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.14/self_attn/Concat_2_output_0", "outputIndexes": +[ 1369 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1366, 1369 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.14/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1370 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1338, 1365, 1370, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.14/self_attn/FusedAttention", "outputIndexes": +[ 1371 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1371 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3301 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3301 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.14/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3302 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3302 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1732675758, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.14/self_attn/o_proj/Linear", "outputIndexes": +[ 3303 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3303 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3304 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3304 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1372 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1292, 1372 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/Add_output_0", "outputIndexes": +[ 1373 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1373 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1742112964, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.14/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1374 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1374 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.14/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3305 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3305 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.14/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3306 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3306 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1742145732, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.14/mlp/gate_proj/Linear", "outputIndexes": +[ 3307 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3307 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3308 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3308 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.14/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1375 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1375 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.14/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1376 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3306 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1775175898, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.14/mlp/up_proj/Linear", "outputIndexes": +[ 3311 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3311 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3312 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3312 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.14/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1377 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1376, 1377 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/mlp/Mul_output_0", "outputIndexes": +[ 1378 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1378 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.14/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3313 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3313 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.14/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3314 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3314 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1808206064, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.14/mlp/down_proj/Linear", "outputIndexes": +[ 3315 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3315 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3316 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3316 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.14/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1379 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1373, 1379 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/Add_1_output_0", "outputIndexes": +[ 1380 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1380, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.15/Reshape_output_0", "outputIndexes": +[ 1381 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1381 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1841236230, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.15/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1382 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1382 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3317 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3317 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.15/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3318 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3318 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1841268998, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.15/self_attn/q_proj/Linear", "outputIndexes": +[ 3319 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3319 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3320 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3320 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1383 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1382 ] +, "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_output_0", "outputIndexes": +[ 1384 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1384 ] +, "main_type": "NONE", "name": "Shape2043", "outputIndexes": +[ 1385 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1384 ] +, "main_type": "NONE", "name": "Rank2045", "outputIndexes": +[ 1386 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1386, 1386 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2047", "outputIndexes": +[ 1387 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1387 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2048", "outputIndexes": +[ 1388 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1387, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2050", "outputIndexes": +[ 1389 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1389 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2051", "outputIndexes": +[ 1390 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1385, 1388, 1390, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2054", "outputIndexes": +[ 1391 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1391 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2055", "outputIndexes": +[ 1392 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1392, 1392 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2057", "outputIndexes": +[ 1393 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1384, 1393, 1387 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.15/self_attn/Gather_output_0", "outputIndexes": +[ 1394 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1394, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1395 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1387 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2065", "outputIndexes": +[ 1396 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1389 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2068", "outputIndexes": +[ 1397 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1385, 1396, 1397, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2071", "outputIndexes": +[ 1398 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1398 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2072", "outputIndexes": +[ 1399 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1399 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2073", "outputIndexes": +[ 1400 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1400, 1399 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2074", "outputIndexes": +[ 1401 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1384, 1401, 1387 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.15/self_attn/Gather_1_output_0", "outputIndexes": +[ 1402 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1402, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1403 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1395, 1403, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.15/self_attn/Concat_output_0", "outputIndexes": +[ 1404 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1383, 1404 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.15/self_attn/Reshape_output_0", "outputIndexes": +[ 1405 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1405, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Mul_output_0", "outputIndexes": +[ 1406 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1405 ] +, "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_2_output_0", "outputIndexes": +[ 1407 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1407 ] +, "main_type": "NONE", "name": "Shape2081", "outputIndexes": +[ 1408 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1407 ] +, "main_type": "NONE", "name": "Rank2083", "outputIndexes": +[ 1409 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1409, 1409 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2085", "outputIndexes": +[ 1410 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1410 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2086", "outputIndexes": +[ 1411 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1410, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2088", "outputIndexes": +[ 1412 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1412 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2089", "outputIndexes": +[ 1413 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1408, 1411, 1413, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2092", "outputIndexes": +[ 1414 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1414 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2093", "outputIndexes": +[ 1415 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1415 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2094", "outputIndexes": +[ 1416 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1416, 1415 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2095", "outputIndexes": +[ 1417 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1407, 1417, 1410 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.15/self_attn/Gather_2_output_0", "outputIndexes": +[ 1418 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1418, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Div_output_0", "outputIndexes": +[ 1419 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1419, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1420 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1405, 1420, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.15/self_attn/Slice_1_output_0", "outputIndexes": +[ 1421 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1421 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.15/self_attn/Neg_output_0", "outputIndexes": +[ 1422 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1419, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1423 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1405, 20, 1423, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.15/self_attn/Slice_output_0", "outputIndexes": +[ 1424 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1422, 1424 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.15/self_attn/Concat_3_output_0", "outputIndexes": +[ 1425 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1425, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Mul_1_output_0", "outputIndexes": +[ 1426 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1406, 1426 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Add_output_0", "outputIndexes": +[ 1427 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3318 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1850706204, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.15/self_attn/k_proj/Linear", "outputIndexes": +[ 3323 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3323 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3324 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3324 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1428 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1394, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1429 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1402, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1430 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1429, 1430, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.15/self_attn/Concat_1_output_0", "outputIndexes": +[ 1431 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1428, 1431 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.15/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1432 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1432, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Mul_2_output_0", "outputIndexes": +[ 1433 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1432 ] +, "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_3_output_0", "outputIndexes": +[ 1434 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1434 ] +, "main_type": "NONE", "name": "Shape2114", "outputIndexes": +[ 1435 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1434 ] +, "main_type": "NONE", "name": "Rank2116", "outputIndexes": +[ 1436 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1436, 1436 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2118", "outputIndexes": +[ 1437 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1437 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2119", "outputIndexes": +[ 1438 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1437, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2121", "outputIndexes": +[ 1439 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1439 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2122", "outputIndexes": +[ 1440 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1435, 1438, 1440, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2125", "outputIndexes": +[ 1441 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1441 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2126", "outputIndexes": +[ 1442 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1442 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2127", "outputIndexes": +[ 1443 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1443, 1442 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2128", "outputIndexes": +[ 1444 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1434, 1444, 1437 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.15/self_attn/Gather_3_output_0", "outputIndexes": +[ 1445 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1445, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Div_1_output_0", "outputIndexes": +[ 1446 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1446, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1447 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1432, 1447, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.15/self_attn/Slice_3_output_0", "outputIndexes": +[ 1448 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1448 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.15/self_attn/Neg_1_output_0", "outputIndexes": +[ 1449 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1446, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1450 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1432, 20, 1450, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.15/self_attn/Slice_2_output_0", "outputIndexes": +[ 1451 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1449, 1451 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.15/self_attn/Concat_4_output_0", "outputIndexes": +[ 1452 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1452, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Mul_3_output_0", "outputIndexes": +[ 1453 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1433, 1453 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Add_1_output_0", "outputIndexes": +[ 1454 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3318 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1853065522, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.15/self_attn/v_proj/Linear", "outputIndexes": +[ 3327 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3327 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3328 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3328 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1455 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1394, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1456 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1402, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1457 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1456, 1457, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.15/self_attn/Concat_2_output_0", "outputIndexes": +[ 1458 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1455, 1458 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.15/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1459 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1427, 1454, 1459, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.15/self_attn/FusedAttention", "outputIndexes": +[ 1460 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1460 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3329 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3329 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.15/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3330 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3330 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1855424840, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.15/self_attn/o_proj/Linear", "outputIndexes": +[ 3331 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3331 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3332 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3332 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1461 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1381, 1461 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/Add_output_0", "outputIndexes": +[ 1462 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1462 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1864862046, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.15/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1463 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1463 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.15/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3333 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3333 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.15/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3334 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3334 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1864894814, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.15/mlp/gate_proj/Linear", "outputIndexes": +[ 3335 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3335 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3336 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3336 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.15/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1464 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1464 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.15/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1465 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3334 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1897924980, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.15/mlp/up_proj/Linear", "outputIndexes": +[ 3339 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3339 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3340 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3340 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.15/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1466 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1465, 1466 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/mlp/Mul_output_0", "outputIndexes": +[ 1467 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1467 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.15/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3341 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3341 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.15/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3342 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3342 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1930955146, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.15/mlp/down_proj/Linear", "outputIndexes": +[ 3343 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3343 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3344 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3344 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.15/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1468 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1462, 1468 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/Add_1_output_0", "outputIndexes": +[ 1469 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1469, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.16/Reshape_output_0", "outputIndexes": +[ 1470 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1470 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1963985312, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.16/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1471 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1471 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3345 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3345 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.16/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3346 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3346 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1964018080, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.16/self_attn/q_proj/Linear", "outputIndexes": +[ 3347 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3347 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3348 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3348 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1472 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1471 ] +, "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_output_0", "outputIndexes": +[ 1473 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1473 ] +, "main_type": "NONE", "name": "Shape2174", "outputIndexes": +[ 1474 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1473 ] +, "main_type": "NONE", "name": "Rank2176", "outputIndexes": +[ 1475 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1475, 1475 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2178", "outputIndexes": +[ 1476 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1476 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2179", "outputIndexes": +[ 1477 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1476, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2181", "outputIndexes": +[ 1478 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1478 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2182", "outputIndexes": +[ 1479 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1474, 1477, 1479, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2185", "outputIndexes": +[ 1480 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1480 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2186", "outputIndexes": +[ 1481 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1481, 1481 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2188", "outputIndexes": +[ 1482 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1473, 1482, 1476 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.16/self_attn/Gather_output_0", "outputIndexes": +[ 1483 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1483, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1484 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1476 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2196", "outputIndexes": +[ 1485 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1478 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2199", "outputIndexes": +[ 1486 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1474, 1485, 1486, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2202", "outputIndexes": +[ 1487 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1487 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2203", "outputIndexes": +[ 1488 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1488 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2204", "outputIndexes": +[ 1489 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1489, 1488 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2205", "outputIndexes": +[ 1490 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1473, 1490, 1476 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.16/self_attn/Gather_1_output_0", "outputIndexes": +[ 1491 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1491, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1492 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1484, 1492, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.16/self_attn/Concat_output_0", "outputIndexes": +[ 1493 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1472, 1493 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.16/self_attn/Reshape_output_0", "outputIndexes": +[ 1494 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1494, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Mul_output_0", "outputIndexes": +[ 1495 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1494 ] +, "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_2_output_0", "outputIndexes": +[ 1496 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1496 ] +, "main_type": "NONE", "name": "Shape2212", "outputIndexes": +[ 1497 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1496 ] +, "main_type": "NONE", "name": "Rank2214", "outputIndexes": +[ 1498 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1498, 1498 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2216", "outputIndexes": +[ 1499 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1499 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2217", "outputIndexes": +[ 1500 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1499, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2219", "outputIndexes": +[ 1501 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1501 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2220", "outputIndexes": +[ 1502 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1497, 1500, 1502, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2223", "outputIndexes": +[ 1503 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1503 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2224", "outputIndexes": +[ 1504 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1504 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2225", "outputIndexes": +[ 1505 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1505, 1504 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2226", "outputIndexes": +[ 1506 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1496, 1506, 1499 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.16/self_attn/Gather_2_output_0", "outputIndexes": +[ 1507 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1507, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Div_output_0", "outputIndexes": +[ 1508 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1508, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1509 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1494, 1509, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.16/self_attn/Slice_1_output_0", "outputIndexes": +[ 1510 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1510 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.16/self_attn/Neg_output_0", "outputIndexes": +[ 1511 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1508, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1512 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1494, 20, 1512, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.16/self_attn/Slice_output_0", "outputIndexes": +[ 1513 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1511, 1513 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.16/self_attn/Concat_3_output_0", "outputIndexes": +[ 1514 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1514, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Mul_1_output_0", "outputIndexes": +[ 1515 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1495, 1515 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Add_output_0", "outputIndexes": +[ 1516 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3346 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1973455286, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.16/self_attn/k_proj/Linear", "outputIndexes": +[ 3351 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3351 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3352 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3352 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1517 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1483, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1518 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1491, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1519 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1518, 1519, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.16/self_attn/Concat_1_output_0", "outputIndexes": +[ 1520 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1517, 1520 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.16/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1521 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1521, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Mul_2_output_0", "outputIndexes": +[ 1522 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1521 ] +, "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_3_output_0", "outputIndexes": +[ 1523 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1523 ] +, "main_type": "NONE", "name": "Shape2245", "outputIndexes": +[ 1524 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1523 ] +, "main_type": "NONE", "name": "Rank2247", "outputIndexes": +[ 1525 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1525, 1525 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2249", "outputIndexes": +[ 1526 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1526 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2250", "outputIndexes": +[ 1527 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1526, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2252", "outputIndexes": +[ 1528 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1528 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2253", "outputIndexes": +[ 1529 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1524, 1527, 1529, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2256", "outputIndexes": +[ 1530 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1530 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2257", "outputIndexes": +[ 1531 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1531 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2258", "outputIndexes": +[ 1532 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1532, 1531 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2259", "outputIndexes": +[ 1533 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1523, 1533, 1526 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.16/self_attn/Gather_3_output_0", "outputIndexes": +[ 1534 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1534, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Div_1_output_0", "outputIndexes": +[ 1535 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1535, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1536 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1521, 1536, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.16/self_attn/Slice_3_output_0", "outputIndexes": +[ 1537 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1537 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.16/self_attn/Neg_1_output_0", "outputIndexes": +[ 1538 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1535, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1539 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1521, 20, 1539, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.16/self_attn/Slice_2_output_0", "outputIndexes": +[ 1540 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1538, 1540 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.16/self_attn/Concat_4_output_0", "outputIndexes": +[ 1541 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1541, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Mul_3_output_0", "outputIndexes": +[ 1542 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1522, 1542 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Add_1_output_0", "outputIndexes": +[ 1543 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3346 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1975814604, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.16/self_attn/v_proj/Linear", "outputIndexes": +[ 3355 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3355 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3356 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3356 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1544 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1483, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1545 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1491, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1546 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1545, 1546, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.16/self_attn/Concat_2_output_0", "outputIndexes": +[ 1547 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1544, 1547 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.16/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1548 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1516, 1543, 1548, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.16/self_attn/FusedAttention", "outputIndexes": +[ 1549 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1549 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3357 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3357 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.16/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3358 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3358 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1978173922, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.16/self_attn/o_proj/Linear", "outputIndexes": +[ 3359 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3359 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3360 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3360 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1550 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1470, 1550 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/Add_output_0", "outputIndexes": +[ 1551 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1551 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 1987611128, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.16/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1552 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1552 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.16/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3361 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3361 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.16/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3362 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3362 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1987643896, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.16/mlp/gate_proj/Linear", "outputIndexes": +[ 3363 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3363 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3364 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3364 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.16/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1553 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1553 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.16/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1554 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3362 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2020674062, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.16/mlp/up_proj/Linear", "outputIndexes": +[ 3367 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3367 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3368 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3368 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.16/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1555 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1554, 1555 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/mlp/Mul_output_0", "outputIndexes": +[ 1556 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1556 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.16/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3369 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3369 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.16/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3370 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3370 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2053704228, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.16/mlp/down_proj/Linear", "outputIndexes": +[ 3371 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3371 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3372 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3372 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.16/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1557 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1551, 1557 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/Add_1_output_0", "outputIndexes": +[ 1558 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1558, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.17/Reshape_output_0", "outputIndexes": +[ 1559 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1559 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2086734394, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.17/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1560 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1560 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3373 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3373 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.17/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3374 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3374 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2086767162, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.17/self_attn/q_proj/Linear", "outputIndexes": +[ 3375 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3375 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3376 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3376 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1561 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1560 ] +, "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_output_0", "outputIndexes": +[ 1562 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1562 ] +, "main_type": "NONE", "name": "Shape2305", "outputIndexes": +[ 1563 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1562 ] +, "main_type": "NONE", "name": "Rank2307", "outputIndexes": +[ 1564 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1564, 1564 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2309", "outputIndexes": +[ 1565 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1565 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2310", "outputIndexes": +[ 1566 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1565, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2312", "outputIndexes": +[ 1567 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1567 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2313", "outputIndexes": +[ 1568 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1563, 1566, 1568, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2316", "outputIndexes": +[ 1569 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1569 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2317", "outputIndexes": +[ 1570 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1570, 1570 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2319", "outputIndexes": +[ 1571 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1562, 1571, 1565 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.17/self_attn/Gather_output_0", "outputIndexes": +[ 1572 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1572, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1573 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1565 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2327", "outputIndexes": +[ 1574 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1567 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2330", "outputIndexes": +[ 1575 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1563, 1574, 1575, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2333", "outputIndexes": +[ 1576 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1576 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2334", "outputIndexes": +[ 1577 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1577 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2335", "outputIndexes": +[ 1578 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1578, 1577 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2336", "outputIndexes": +[ 1579 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1562, 1579, 1565 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.17/self_attn/Gather_1_output_0", "outputIndexes": +[ 1580 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1580, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1581 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1573, 1581, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.17/self_attn/Concat_output_0", "outputIndexes": +[ 1582 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1561, 1582 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.17/self_attn/Reshape_output_0", "outputIndexes": +[ 1583 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1583, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Mul_output_0", "outputIndexes": +[ 1584 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1583 ] +, "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_2_output_0", "outputIndexes": +[ 1585 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1585 ] +, "main_type": "NONE", "name": "Shape2343", "outputIndexes": +[ 1586 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1585 ] +, "main_type": "NONE", "name": "Rank2345", "outputIndexes": +[ 1587 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1587, 1587 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2347", "outputIndexes": +[ 1588 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1588 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2348", "outputIndexes": +[ 1589 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1588, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2350", "outputIndexes": +[ 1590 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1590 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2351", "outputIndexes": +[ 1591 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1586, 1589, 1591, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2354", "outputIndexes": +[ 1592 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1592 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2355", "outputIndexes": +[ 1593 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1593 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2356", "outputIndexes": +[ 1594 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1594, 1593 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2357", "outputIndexes": +[ 1595 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1585, 1595, 1588 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.17/self_attn/Gather_2_output_0", "outputIndexes": +[ 1596 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1596, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Div_output_0", "outputIndexes": +[ 1597 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1597, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1598 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1583, 1598, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.17/self_attn/Slice_1_output_0", "outputIndexes": +[ 1599 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1599 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.17/self_attn/Neg_output_0", "outputIndexes": +[ 1600 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1597, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1601 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1583, 20, 1601, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.17/self_attn/Slice_output_0", "outputIndexes": +[ 1602 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1600, 1602 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.17/self_attn/Concat_3_output_0", "outputIndexes": +[ 1603 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1603, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Mul_1_output_0", "outputIndexes": +[ 1604 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1584, 1604 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Add_output_0", "outputIndexes": +[ 1605 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3374 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2096204368, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.17/self_attn/k_proj/Linear", "outputIndexes": +[ 3379 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3379 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3380 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3380 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1606 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1572, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1607 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1580, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1608 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1607, 1608, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.17/self_attn/Concat_1_output_0", "outputIndexes": +[ 1609 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1606, 1609 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.17/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1610 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1610, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Mul_2_output_0", "outputIndexes": +[ 1611 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1610 ] +, "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_3_output_0", "outputIndexes": +[ 1612 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1612 ] +, "main_type": "NONE", "name": "Shape2376", "outputIndexes": +[ 1613 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1612 ] +, "main_type": "NONE", "name": "Rank2378", "outputIndexes": +[ 1614 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1614, 1614 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2380", "outputIndexes": +[ 1615 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1615 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2381", "outputIndexes": +[ 1616 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1615, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2383", "outputIndexes": +[ 1617 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1617 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2384", "outputIndexes": +[ 1618 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1613, 1616, 1618, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2387", "outputIndexes": +[ 1619 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1619 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2388", "outputIndexes": +[ 1620 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1620 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2389", "outputIndexes": +[ 1621 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1621, 1620 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2390", "outputIndexes": +[ 1622 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1612, 1622, 1615 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.17/self_attn/Gather_3_output_0", "outputIndexes": +[ 1623 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1623, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Div_1_output_0", "outputIndexes": +[ 1624 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1624, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1625 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1610, 1625, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.17/self_attn/Slice_3_output_0", "outputIndexes": +[ 1626 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1626 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.17/self_attn/Neg_1_output_0", "outputIndexes": +[ 1627 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1624, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1628 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1610, 20, 1628, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.17/self_attn/Slice_2_output_0", "outputIndexes": +[ 1629 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1627, 1629 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.17/self_attn/Concat_4_output_0", "outputIndexes": +[ 1630 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1630, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Mul_3_output_0", "outputIndexes": +[ 1631 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1611, 1631 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Add_1_output_0", "outputIndexes": +[ 1632 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3374 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2098563686, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.17/self_attn/v_proj/Linear", "outputIndexes": +[ 3383 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3383 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3384 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3384 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1633 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1572, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1634 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1580, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1635 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1634, 1635, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.17/self_attn/Concat_2_output_0", "outputIndexes": +[ 1636 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1633, 1636 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.17/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1637 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1605, 1632, 1637, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.17/self_attn/FusedAttention", "outputIndexes": +[ 1638 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1638 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3385 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3385 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.17/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3386 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3386 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2100923004, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.17/self_attn/o_proj/Linear", "outputIndexes": +[ 3387 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3387 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3388 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3388 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1639 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1559, 1639 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/Add_output_0", "outputIndexes": +[ 1640 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1640 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2110360210, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.17/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1641 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1641 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.17/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3389 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3389 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.17/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3390 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3390 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2110392978, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.17/mlp/gate_proj/Linear", "outputIndexes": +[ 3391 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3391 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3392 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3392 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.17/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1642 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1642 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.17/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1643 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3390 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2143423144, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.17/mlp/up_proj/Linear", "outputIndexes": +[ 3395 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3395 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3396 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3396 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.17/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1644 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1643, 1644 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/mlp/Mul_output_0", "outputIndexes": +[ 1645 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1645 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.17/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3397 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3397 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.17/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3398 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3398 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2176453310, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.17/mlp/down_proj/Linear", "outputIndexes": +[ 3399 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3399 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3400 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3400 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.17/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1646 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1640, 1646 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/Add_1_output_0", "outputIndexes": +[ 1647 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1647, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.18/Reshape_output_0", "outputIndexes": +[ 1648 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1648 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2209483476, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.18/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1649 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1649 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3401 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3401 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.18/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3402 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3402 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2209516244, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.18/self_attn/q_proj/Linear", "outputIndexes": +[ 3403 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3403 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3404 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3404 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1650 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1649 ] +, "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_output_0", "outputIndexes": +[ 1651 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1651 ] +, "main_type": "NONE", "name": "Shape2436", "outputIndexes": +[ 1652 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1651 ] +, "main_type": "NONE", "name": "Rank2438", "outputIndexes": +[ 1653 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1653, 1653 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2440", "outputIndexes": +[ 1654 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1654 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2441", "outputIndexes": +[ 1655 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1654, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2443", "outputIndexes": +[ 1656 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1656 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2444", "outputIndexes": +[ 1657 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1652, 1655, 1657, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2447", "outputIndexes": +[ 1658 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1658 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2448", "outputIndexes": +[ 1659 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1659, 1659 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2450", "outputIndexes": +[ 1660 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1651, 1660, 1654 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.18/self_attn/Gather_output_0", "outputIndexes": +[ 1661 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1661, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1662 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1654 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2458", "outputIndexes": +[ 1663 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1656 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2461", "outputIndexes": +[ 1664 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1652, 1663, 1664, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2464", "outputIndexes": +[ 1665 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1665 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2465", "outputIndexes": +[ 1666 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1666 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2466", "outputIndexes": +[ 1667 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1667, 1666 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2467", "outputIndexes": +[ 1668 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1651, 1668, 1654 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.18/self_attn/Gather_1_output_0", "outputIndexes": +[ 1669 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1669, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1670 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1662, 1670, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.18/self_attn/Concat_output_0", "outputIndexes": +[ 1671 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1650, 1671 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.18/self_attn/Reshape_output_0", "outputIndexes": +[ 1672 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1672, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Mul_output_0", "outputIndexes": +[ 1673 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1672 ] +, "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_2_output_0", "outputIndexes": +[ 1674 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1674 ] +, "main_type": "NONE", "name": "Shape2474", "outputIndexes": +[ 1675 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1674 ] +, "main_type": "NONE", "name": "Rank2476", "outputIndexes": +[ 1676 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1676, 1676 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2478", "outputIndexes": +[ 1677 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1677 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2479", "outputIndexes": +[ 1678 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1677, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2481", "outputIndexes": +[ 1679 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1679 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2482", "outputIndexes": +[ 1680 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1675, 1678, 1680, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2485", "outputIndexes": +[ 1681 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1681 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2486", "outputIndexes": +[ 1682 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1682 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2487", "outputIndexes": +[ 1683 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1683, 1682 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2488", "outputIndexes": +[ 1684 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1674, 1684, 1677 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.18/self_attn/Gather_2_output_0", "outputIndexes": +[ 1685 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1685, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Div_output_0", "outputIndexes": +[ 1686 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1686, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1687 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1672, 1687, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.18/self_attn/Slice_1_output_0", "outputIndexes": +[ 1688 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1688 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.18/self_attn/Neg_output_0", "outputIndexes": +[ 1689 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1686, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1690 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1672, 20, 1690, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.18/self_attn/Slice_output_0", "outputIndexes": +[ 1691 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1689, 1691 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.18/self_attn/Concat_3_output_0", "outputIndexes": +[ 1692 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1692, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Mul_1_output_0", "outputIndexes": +[ 1693 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1673, 1693 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Add_output_0", "outputIndexes": +[ 1694 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3402 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2218953450, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.18/self_attn/k_proj/Linear", "outputIndexes": +[ 3407 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3407 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3408 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3408 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1695 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1661, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1696 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1669, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1697 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1696, 1697, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.18/self_attn/Concat_1_output_0", "outputIndexes": +[ 1698 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1695, 1698 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.18/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1699 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1699, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Mul_2_output_0", "outputIndexes": +[ 1700 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1699 ] +, "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_3_output_0", "outputIndexes": +[ 1701 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1701 ] +, "main_type": "NONE", "name": "Shape2507", "outputIndexes": +[ 1702 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1701 ] +, "main_type": "NONE", "name": "Rank2509", "outputIndexes": +[ 1703 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1703, 1703 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2511", "outputIndexes": +[ 1704 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1704 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2512", "outputIndexes": +[ 1705 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1704, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2514", "outputIndexes": +[ 1706 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1706 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2515", "outputIndexes": +[ 1707 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1702, 1705, 1707, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2518", "outputIndexes": +[ 1708 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1708 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2519", "outputIndexes": +[ 1709 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1709 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2520", "outputIndexes": +[ 1710 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1710, 1709 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2521", "outputIndexes": +[ 1711 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1701, 1711, 1704 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.18/self_attn/Gather_3_output_0", "outputIndexes": +[ 1712 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1712, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Div_1_output_0", "outputIndexes": +[ 1713 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1713, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1714 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1699, 1714, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.18/self_attn/Slice_3_output_0", "outputIndexes": +[ 1715 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1715 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.18/self_attn/Neg_1_output_0", "outputIndexes": +[ 1716 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1713, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1717 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1699, 20, 1717, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.18/self_attn/Slice_2_output_0", "outputIndexes": +[ 1718 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1716, 1718 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.18/self_attn/Concat_4_output_0", "outputIndexes": +[ 1719 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1719, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Mul_3_output_0", "outputIndexes": +[ 1720 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1700, 1720 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Add_1_output_0", "outputIndexes": +[ 1721 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3402 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2221312768, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.18/self_attn/v_proj/Linear", "outputIndexes": +[ 3411 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3411 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3412 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3412 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1722 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1661, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1723 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1669, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1724 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1723, 1724, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.18/self_attn/Concat_2_output_0", "outputIndexes": +[ 1725 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1722, 1725 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.18/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1726 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1694, 1721, 1726, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.18/self_attn/FusedAttention", "outputIndexes": +[ 1727 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1727 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3413 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3413 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.18/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3414 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3414 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2223672086, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.18/self_attn/o_proj/Linear", "outputIndexes": +[ 3415 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3415 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3416 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3416 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1728 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1648, 1728 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/Add_output_0", "outputIndexes": +[ 1729 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1729 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2233109292, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.18/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1730 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1730 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.18/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3417 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3417 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.18/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3418 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3418 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2233142060, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.18/mlp/gate_proj/Linear", "outputIndexes": +[ 3419 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3419 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3420 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3420 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.18/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1731 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1731 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.18/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1732 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3418 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2266172226, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.18/mlp/up_proj/Linear", "outputIndexes": +[ 3423 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3423 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3424 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3424 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.18/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1733 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1732, 1733 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/mlp/Mul_output_0", "outputIndexes": +[ 1734 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1734 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.18/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3425 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3425 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.18/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3426 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3426 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2299202392, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.18/mlp/down_proj/Linear", "outputIndexes": +[ 3427 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3427 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3428 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3428 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.18/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1735 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1729, 1735 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/Add_1_output_0", "outputIndexes": +[ 1736 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1736, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.19/Reshape_output_0", "outputIndexes": +[ 1737 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1737 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2332232558, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.19/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1738 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1738 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3429 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3429 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.19/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3430 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3430 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2332265326, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.19/self_attn/q_proj/Linear", "outputIndexes": +[ 3431 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3431 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3432 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3432 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1739 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1738 ] +, "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_output_0", "outputIndexes": +[ 1740 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1740 ] +, "main_type": "NONE", "name": "Shape2567", "outputIndexes": +[ 1741 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1740 ] +, "main_type": "NONE", "name": "Rank2569", "outputIndexes": +[ 1742 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1742, 1742 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2571", "outputIndexes": +[ 1743 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1743 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2572", "outputIndexes": +[ 1744 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1743, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2574", "outputIndexes": +[ 1745 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1745 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2575", "outputIndexes": +[ 1746 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1741, 1744, 1746, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2578", "outputIndexes": +[ 1747 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1747 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2579", "outputIndexes": +[ 1748 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1748, 1748 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2581", "outputIndexes": +[ 1749 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1740, 1749, 1743 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.19/self_attn/Gather_output_0", "outputIndexes": +[ 1750 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1750, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1751 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1743 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2589", "outputIndexes": +[ 1752 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1745 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2592", "outputIndexes": +[ 1753 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1741, 1752, 1753, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2595", "outputIndexes": +[ 1754 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1754 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2596", "outputIndexes": +[ 1755 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1755 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2597", "outputIndexes": +[ 1756 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1756, 1755 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2598", "outputIndexes": +[ 1757 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1740, 1757, 1743 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.19/self_attn/Gather_1_output_0", "outputIndexes": +[ 1758 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1758, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1759 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1751, 1759, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.19/self_attn/Concat_output_0", "outputIndexes": +[ 1760 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1739, 1760 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.19/self_attn/Reshape_output_0", "outputIndexes": +[ 1761 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1761, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Mul_output_0", "outputIndexes": +[ 1762 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1761 ] +, "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_2_output_0", "outputIndexes": +[ 1763 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1763 ] +, "main_type": "NONE", "name": "Shape2605", "outputIndexes": +[ 1764 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1763 ] +, "main_type": "NONE", "name": "Rank2607", "outputIndexes": +[ 1765 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1765, 1765 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2609", "outputIndexes": +[ 1766 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1766 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2610", "outputIndexes": +[ 1767 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1766, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2612", "outputIndexes": +[ 1768 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1768 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2613", "outputIndexes": +[ 1769 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1764, 1767, 1769, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2616", "outputIndexes": +[ 1770 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1770 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2617", "outputIndexes": +[ 1771 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1771 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2618", "outputIndexes": +[ 1772 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1772, 1771 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2619", "outputIndexes": +[ 1773 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1763, 1773, 1766 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.19/self_attn/Gather_2_output_0", "outputIndexes": +[ 1774 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1774, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Div_output_0", "outputIndexes": +[ 1775 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1775, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1776 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1761, 1776, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.19/self_attn/Slice_1_output_0", "outputIndexes": +[ 1777 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1777 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.19/self_attn/Neg_output_0", "outputIndexes": +[ 1778 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1775, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1779 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1761, 20, 1779, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.19/self_attn/Slice_output_0", "outputIndexes": +[ 1780 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1778, 1780 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.19/self_attn/Concat_3_output_0", "outputIndexes": +[ 1781 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1781, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Mul_1_output_0", "outputIndexes": +[ 1782 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1762, 1782 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Add_output_0", "outputIndexes": +[ 1783 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3430 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2341702532, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.19/self_attn/k_proj/Linear", "outputIndexes": +[ 3435 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3435 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3436 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3436 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1784 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1750, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1785 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1758, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1786 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1785, 1786, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.19/self_attn/Concat_1_output_0", "outputIndexes": +[ 1787 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1784, 1787 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.19/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1788 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1788, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Mul_2_output_0", "outputIndexes": +[ 1789 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1788 ] +, "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_3_output_0", "outputIndexes": +[ 1790 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1790 ] +, "main_type": "NONE", "name": "Shape2638", "outputIndexes": +[ 1791 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1790 ] +, "main_type": "NONE", "name": "Rank2640", "outputIndexes": +[ 1792 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1792, 1792 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2642", "outputIndexes": +[ 1793 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1793 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2643", "outputIndexes": +[ 1794 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1793, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2645", "outputIndexes": +[ 1795 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1795 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2646", "outputIndexes": +[ 1796 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1791, 1794, 1796, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2649", "outputIndexes": +[ 1797 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1797 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2650", "outputIndexes": +[ 1798 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1798 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2651", "outputIndexes": +[ 1799 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1799, 1798 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2652", "outputIndexes": +[ 1800 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1790, 1800, 1793 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.19/self_attn/Gather_3_output_0", "outputIndexes": +[ 1801 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1801, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Div_1_output_0", "outputIndexes": +[ 1802 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1802, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1803 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1788, 1803, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.19/self_attn/Slice_3_output_0", "outputIndexes": +[ 1804 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1804 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.19/self_attn/Neg_1_output_0", "outputIndexes": +[ 1805 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1802, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1806 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1788, 20, 1806, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.19/self_attn/Slice_2_output_0", "outputIndexes": +[ 1807 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1805, 1807 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.19/self_attn/Concat_4_output_0", "outputIndexes": +[ 1808 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1808, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Mul_3_output_0", "outputIndexes": +[ 1809 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1789, 1809 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Add_1_output_0", "outputIndexes": +[ 1810 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3430 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2344061850, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.19/self_attn/v_proj/Linear", "outputIndexes": +[ 3439 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3439 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3440 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3440 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1811 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1750, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1812 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1758, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1813 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1812, 1813, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.19/self_attn/Concat_2_output_0", "outputIndexes": +[ 1814 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1811, 1814 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.19/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1815 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1783, 1810, 1815, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.19/self_attn/FusedAttention", "outputIndexes": +[ 1816 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1816 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3441 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3441 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.19/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3442 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3442 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2346421168, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.19/self_attn/o_proj/Linear", "outputIndexes": +[ 3443 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3443 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3444 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3444 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1817 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1737, 1817 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/Add_output_0", "outputIndexes": +[ 1818 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1818 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2355858374, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.19/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1819 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1819 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.19/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3445 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3445 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.19/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3446 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3446 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2355891142, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.19/mlp/gate_proj/Linear", "outputIndexes": +[ 3447 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3447 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3448 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3448 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.19/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1820 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1820 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.19/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1821 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3446 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2388921308, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.19/mlp/up_proj/Linear", "outputIndexes": +[ 3451 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3451 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3452 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3452 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.19/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1822 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1821, 1822 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/mlp/Mul_output_0", "outputIndexes": +[ 1823 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1823 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.19/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3453 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3453 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.19/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3454 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3454 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2421951474, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.19/mlp/down_proj/Linear", "outputIndexes": +[ 3455 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3455 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3456 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3456 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.19/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1824 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1818, 1824 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/Add_1_output_0", "outputIndexes": +[ 1825 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1825, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.20/Reshape_output_0", "outputIndexes": +[ 1826 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1826 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2454981640, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.20/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1827 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1827 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3457 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3457 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.20/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3458 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3458 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2455014408, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.20/self_attn/q_proj/Linear", "outputIndexes": +[ 3459 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3459 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3460 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3460 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1828 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1827 ] +, "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_output_0", "outputIndexes": +[ 1829 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1829 ] +, "main_type": "NONE", "name": "Shape2698", "outputIndexes": +[ 1830 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1829 ] +, "main_type": "NONE", "name": "Rank2700", "outputIndexes": +[ 1831 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1831, 1831 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2702", "outputIndexes": +[ 1832 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1832 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2703", "outputIndexes": +[ 1833 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1832, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2705", "outputIndexes": +[ 1834 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1834 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2706", "outputIndexes": +[ 1835 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1830, 1833, 1835, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2709", "outputIndexes": +[ 1836 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1836 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2710", "outputIndexes": +[ 1837 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1837, 1837 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2712", "outputIndexes": +[ 1838 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1829, 1838, 1832 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.20/self_attn/Gather_output_0", "outputIndexes": +[ 1839 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1839, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1840 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1832 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2720", "outputIndexes": +[ 1841 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1834 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2723", "outputIndexes": +[ 1842 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1830, 1841, 1842, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2726", "outputIndexes": +[ 1843 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1843 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2727", "outputIndexes": +[ 1844 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1844 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2728", "outputIndexes": +[ 1845 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1845, 1844 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2729", "outputIndexes": +[ 1846 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1829, 1846, 1832 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.20/self_attn/Gather_1_output_0", "outputIndexes": +[ 1847 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1847, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1848 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1840, 1848, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.20/self_attn/Concat_output_0", "outputIndexes": +[ 1849 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1828, 1849 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.20/self_attn/Reshape_output_0", "outputIndexes": +[ 1850 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1850, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Mul_output_0", "outputIndexes": +[ 1851 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1850 ] +, "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_2_output_0", "outputIndexes": +[ 1852 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1852 ] +, "main_type": "NONE", "name": "Shape2736", "outputIndexes": +[ 1853 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1852 ] +, "main_type": "NONE", "name": "Rank2738", "outputIndexes": +[ 1854 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1854, 1854 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2740", "outputIndexes": +[ 1855 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1855 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2741", "outputIndexes": +[ 1856 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1855, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2743", "outputIndexes": +[ 1857 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1857 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2744", "outputIndexes": +[ 1858 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1853, 1856, 1858, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2747", "outputIndexes": +[ 1859 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1859 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2748", "outputIndexes": +[ 1860 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1860 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2749", "outputIndexes": +[ 1861 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1861, 1860 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2750", "outputIndexes": +[ 1862 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1852, 1862, 1855 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.20/self_attn/Gather_2_output_0", "outputIndexes": +[ 1863 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1863, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Div_output_0", "outputIndexes": +[ 1864 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1864, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1865 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1850, 1865, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.20/self_attn/Slice_1_output_0", "outputIndexes": +[ 1866 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1866 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.20/self_attn/Neg_output_0", "outputIndexes": +[ 1867 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1864, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1868 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1850, 20, 1868, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.20/self_attn/Slice_output_0", "outputIndexes": +[ 1869 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1867, 1869 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.20/self_attn/Concat_3_output_0", "outputIndexes": +[ 1870 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1870, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Mul_1_output_0", "outputIndexes": +[ 1871 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1851, 1871 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Add_output_0", "outputIndexes": +[ 1872 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3458 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2464451614, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.20/self_attn/k_proj/Linear", "outputIndexes": +[ 3463 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3463 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3464 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3464 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1873 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1839, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1874 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1847, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1875 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1874, 1875, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.20/self_attn/Concat_1_output_0", "outputIndexes": +[ 1876 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1873, 1876 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.20/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1877 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1877, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Mul_2_output_0", "outputIndexes": +[ 1878 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1877 ] +, "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_3_output_0", "outputIndexes": +[ 1879 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1879 ] +, "main_type": "NONE", "name": "Shape2769", "outputIndexes": +[ 1880 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1879 ] +, "main_type": "NONE", "name": "Rank2771", "outputIndexes": +[ 1881 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1881, 1881 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2773", "outputIndexes": +[ 1882 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1882 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2774", "outputIndexes": +[ 1883 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1882, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2776", "outputIndexes": +[ 1884 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1884 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2777", "outputIndexes": +[ 1885 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1880, 1883, 1885, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2780", "outputIndexes": +[ 1886 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1886 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2781", "outputIndexes": +[ 1887 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1887 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2782", "outputIndexes": +[ 1888 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1888, 1887 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2783", "outputIndexes": +[ 1889 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1879, 1889, 1882 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.20/self_attn/Gather_3_output_0", "outputIndexes": +[ 1890 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1890, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Div_1_output_0", "outputIndexes": +[ 1891 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1891, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1892 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1877, 1892, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.20/self_attn/Slice_3_output_0", "outputIndexes": +[ 1893 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1893 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.20/self_attn/Neg_1_output_0", "outputIndexes": +[ 1894 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1891, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1895 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1877, 20, 1895, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.20/self_attn/Slice_2_output_0", "outputIndexes": +[ 1896 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1894, 1896 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.20/self_attn/Concat_4_output_0", "outputIndexes": +[ 1897 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1897, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Mul_3_output_0", "outputIndexes": +[ 1898 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1878, 1898 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Add_1_output_0", "outputIndexes": +[ 1899 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3458 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2466810932, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.20/self_attn/v_proj/Linear", "outputIndexes": +[ 3467 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3467 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3468 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3468 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1900 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1839, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1901 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1847, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1902 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1901, 1902, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.20/self_attn/Concat_2_output_0", "outputIndexes": +[ 1903 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1900, 1903 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.20/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1904 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1872, 1899, 1904, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.20/self_attn/FusedAttention", "outputIndexes": +[ 1905 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1905 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3469 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3469 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.20/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3470 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3470 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2469170250, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.20/self_attn/o_proj/Linear", "outputIndexes": +[ 3471 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3471 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3472 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3472 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1906 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1826, 1906 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/Add_output_0", "outputIndexes": +[ 1907 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1907 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2478607456, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.20/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1908 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1908 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.20/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3473 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3473 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.20/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3474 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3474 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2478640224, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.20/mlp/gate_proj/Linear", "outputIndexes": +[ 3475 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3475 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3476 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3476 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.20/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1909 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1909 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.20/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1910 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3474 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2511670390, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.20/mlp/up_proj/Linear", "outputIndexes": +[ 3479 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3479 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3480 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3480 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.20/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1911 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1910, 1911 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/mlp/Mul_output_0", "outputIndexes": +[ 1912 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1912 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.20/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3481 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3481 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.20/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3482 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3482 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2544700556, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.20/mlp/down_proj/Linear", "outputIndexes": +[ 3483 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3483 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3484 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3484 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.20/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1913 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1907, 1913 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/Add_1_output_0", "outputIndexes": +[ 1914 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1914, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.21/Reshape_output_0", "outputIndexes": +[ 1915 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1915 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2577730722, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.21/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1916 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1916 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3485 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3485 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.21/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3486 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3486 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2577763490, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.21/self_attn/q_proj/Linear", "outputIndexes": +[ 3487 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3487 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3488 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3488 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1917 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1916 ] +, "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_output_0", "outputIndexes": +[ 1918 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1918 ] +, "main_type": "NONE", "name": "Shape2829", "outputIndexes": +[ 1919 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1918 ] +, "main_type": "NONE", "name": "Rank2831", "outputIndexes": +[ 1920 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1920, 1920 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2833", "outputIndexes": +[ 1921 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1921 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2834", "outputIndexes": +[ 1922 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1921, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2836", "outputIndexes": +[ 1923 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1923 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2837", "outputIndexes": +[ 1924 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1919, 1922, 1924, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2840", "outputIndexes": +[ 1925 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1925 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2841", "outputIndexes": +[ 1926 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1926, 1926 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2843", "outputIndexes": +[ 1927 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1918, 1927, 1921 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.21/self_attn/Gather_output_0", "outputIndexes": +[ 1928 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1928, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1929 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1921 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2851", "outputIndexes": +[ 1930 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1923 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2854", "outputIndexes": +[ 1931 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1919, 1930, 1931, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2857", "outputIndexes": +[ 1932 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1932 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2858", "outputIndexes": +[ 1933 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 1933 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2859", "outputIndexes": +[ 1934 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1934, 1933 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2860", "outputIndexes": +[ 1935 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1918, 1935, 1921 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.21/self_attn/Gather_1_output_0", "outputIndexes": +[ 1936 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1936, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1937 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1929, 1937, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.21/self_attn/Concat_output_0", "outputIndexes": +[ 1938 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1917, 1938 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.21/self_attn/Reshape_output_0", "outputIndexes": +[ 1939 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1939, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Mul_output_0", "outputIndexes": +[ 1940 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1939 ] +, "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_2_output_0", "outputIndexes": +[ 1941 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1941 ] +, "main_type": "NONE", "name": "Shape2867", "outputIndexes": +[ 1942 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1941 ] +, "main_type": "NONE", "name": "Rank2869", "outputIndexes": +[ 1943 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1943, 1943 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2871", "outputIndexes": +[ 1944 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1944 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2872", "outputIndexes": +[ 1945 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1944, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2874", "outputIndexes": +[ 1946 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1946 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2875", "outputIndexes": +[ 1947 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1942, 1945, 1947, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2878", "outputIndexes": +[ 1948 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1948 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2879", "outputIndexes": +[ 1949 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1949 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2880", "outputIndexes": +[ 1950 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1950, 1949 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2881", "outputIndexes": +[ 1951 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1941, 1951, 1944 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.21/self_attn/Gather_2_output_0", "outputIndexes": +[ 1952 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1952, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Div_output_0", "outputIndexes": +[ 1953 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1953, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1954 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1939, 1954, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.21/self_attn/Slice_1_output_0", "outputIndexes": +[ 1955 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1955 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.21/self_attn/Neg_output_0", "outputIndexes": +[ 1956 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1953, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1957 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1939, 20, 1957, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.21/self_attn/Slice_output_0", "outputIndexes": +[ 1958 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1956, 1958 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.21/self_attn/Concat_3_output_0", "outputIndexes": +[ 1959 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1959, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Mul_1_output_0", "outputIndexes": +[ 1960 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1940, 1960 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Add_output_0", "outputIndexes": +[ 1961 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3486 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2587200696, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.21/self_attn/k_proj/Linear", "outputIndexes": +[ 3491 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3491 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3492 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3492 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1962 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1928, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1963 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1936, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1964 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1963, 1964, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.21/self_attn/Concat_1_output_0", "outputIndexes": +[ 1965 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1962, 1965 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.21/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1966 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1966, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Mul_2_output_0", "outputIndexes": +[ 1967 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1966 ] +, "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_3_output_0", "outputIndexes": +[ 1968 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1968 ] +, "main_type": "NONE", "name": "Shape2900", "outputIndexes": +[ 1969 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1968 ] +, "main_type": "NONE", "name": "Rank2902", "outputIndexes": +[ 1970 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1970, 1970 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2904", "outputIndexes": +[ 1971 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1971 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2905", "outputIndexes": +[ 1972 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1971, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2907", "outputIndexes": +[ 1973 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1973 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2908", "outputIndexes": +[ 1974 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1969, 1972, 1974, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2911", "outputIndexes": +[ 1975 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1975 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2912", "outputIndexes": +[ 1976 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 1976 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2913", "outputIndexes": +[ 1977 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1977, 1976 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2914", "outputIndexes": +[ 1978 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1968, 1978, 1971 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.21/self_attn/Gather_3_output_0", "outputIndexes": +[ 1979 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1979, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Div_1_output_0", "outputIndexes": +[ 1980 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1980, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1981 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1966, 1981, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.21/self_attn/Slice_3_output_0", "outputIndexes": +[ 1982 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1982 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.21/self_attn/Neg_1_output_0", "outputIndexes": +[ 1983 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1980, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1984 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1966, 20, 1984, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.21/self_attn/Slice_2_output_0", "outputIndexes": +[ 1985 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1983, 1985 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.21/self_attn/Concat_4_output_0", "outputIndexes": +[ 1986 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1986, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Mul_3_output_0", "outputIndexes": +[ 1987 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1967, 1987 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Add_1_output_0", "outputIndexes": +[ 1988 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3486 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2589560014, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.21/self_attn/v_proj/Linear", "outputIndexes": +[ 3495 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3495 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3496 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3496 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1989 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1928, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1990 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1936, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1991 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1990, 1991, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.21/self_attn/Concat_2_output_0", "outputIndexes": +[ 1992 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1989, 1992 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.21/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1993 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1961, 1988, 1993, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.21/self_attn/FusedAttention", "outputIndexes": +[ 1994 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1994 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3497 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3497 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.21/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3498 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3498 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2591919332, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.21/self_attn/o_proj/Linear", "outputIndexes": +[ 3499 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3499 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3500 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3500 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1995 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1915, 1995 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/Add_output_0", "outputIndexes": +[ 1996 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1996 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2601356538, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.21/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1997 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1997 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.21/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3501 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3501 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.21/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3502 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3502 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2601389306, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.21/mlp/gate_proj/Linear", "outputIndexes": +[ 3503 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3503 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3504 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3504 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.21/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1998 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1998 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.21/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1999 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3502 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2634419472, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.21/mlp/up_proj/Linear", "outputIndexes": +[ 3507 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3507 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3508 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3508 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.21/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2000 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1999, 2000 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/mlp/Mul_output_0", "outputIndexes": +[ 2001 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2001 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.21/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3509 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3509 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.21/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3510 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3510 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2667449638, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.21/mlp/down_proj/Linear", "outputIndexes": +[ 3511 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3511 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3512 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3512 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.21/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2002 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1996, 2002 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/Add_1_output_0", "outputIndexes": +[ 2003 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2003, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.22/Reshape_output_0", "outputIndexes": +[ 2004 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2004 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2700479804, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.22/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2005 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2005 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3513 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3513 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.22/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3514 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3514 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2700512572, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.22/self_attn/q_proj/Linear", "outputIndexes": +[ 3515 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3515 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3516 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3516 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2006 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2005 ] +, "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_output_0", "outputIndexes": +[ 2007 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2007 ] +, "main_type": "NONE", "name": "Shape2960", "outputIndexes": +[ 2008 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2007 ] +, "main_type": "NONE", "name": "Rank2962", "outputIndexes": +[ 2009 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2009, 2009 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2964", "outputIndexes": +[ 2010 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2010 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2965", "outputIndexes": +[ 2011 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2010, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2967", "outputIndexes": +[ 2012 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2012 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2968", "outputIndexes": +[ 2013 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2008, 2011, 2013, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2971", "outputIndexes": +[ 2014 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2014 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2972", "outputIndexes": +[ 2015 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2015, 2015 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2974", "outputIndexes": +[ 2016 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2007, 2016, 2010 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.22/self_attn/Gather_output_0", "outputIndexes": +[ 2017 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2017, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2018 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2010 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2982", "outputIndexes": +[ 2019 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2012 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2985", "outputIndexes": +[ 2020 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2008, 2019, 2020, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2988", "outputIndexes": +[ 2021 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2021 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2989", "outputIndexes": +[ 2022 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 2022 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2990", "outputIndexes": +[ 2023 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2023, 2022 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2991", "outputIndexes": +[ 2024 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2007, 2024, 2010 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.22/self_attn/Gather_1_output_0", "outputIndexes": +[ 2025 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2025, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2026 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2018, 2026, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.22/self_attn/Concat_output_0", "outputIndexes": +[ 2027 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2006, 2027 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.22/self_attn/Reshape_output_0", "outputIndexes": +[ 2028 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2028, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Mul_output_0", "outputIndexes": +[ 2029 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2028 ] +, "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_2_output_0", "outputIndexes": +[ 2030 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2030 ] +, "main_type": "NONE", "name": "Shape2998", "outputIndexes": +[ 2031 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2030 ] +, "main_type": "NONE", "name": "Rank3000", "outputIndexes": +[ 2032 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2032, 2032 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3002", "outputIndexes": +[ 2033 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2033 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3003", "outputIndexes": +[ 2034 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2033, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3005", "outputIndexes": +[ 2035 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2035 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3006", "outputIndexes": +[ 2036 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2031, 2034, 2036, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3009", "outputIndexes": +[ 2037 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2037 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3010", "outputIndexes": +[ 2038 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2038 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3011", "outputIndexes": +[ 2039 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2039, 2038 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3012", "outputIndexes": +[ 2040 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2030, 2040, 2033 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.22/self_attn/Gather_2_output_0", "outputIndexes": +[ 2041 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2041, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Div_output_0", "outputIndexes": +[ 2042 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2042, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2043 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2028, 2043, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.22/self_attn/Slice_1_output_0", "outputIndexes": +[ 2044 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2044 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.22/self_attn/Neg_output_0", "outputIndexes": +[ 2045 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2042, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2046 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2028, 20, 2046, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.22/self_attn/Slice_output_0", "outputIndexes": +[ 2047 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2045, 2047 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.22/self_attn/Concat_3_output_0", "outputIndexes": +[ 2048 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2048, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Mul_1_output_0", "outputIndexes": +[ 2049 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2029, 2049 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Add_output_0", "outputIndexes": +[ 2050 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3514 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2709949778, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.22/self_attn/k_proj/Linear", "outputIndexes": +[ 3519 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3519 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3520 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3520 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2051 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2017, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2052 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2025, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2053 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2052, 2053, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.22/self_attn/Concat_1_output_0", "outputIndexes": +[ 2054 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2051, 2054 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.22/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2055 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2055, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Mul_2_output_0", "outputIndexes": +[ 2056 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2055 ] +, "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_3_output_0", "outputIndexes": +[ 2057 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2057 ] +, "main_type": "NONE", "name": "Shape3031", "outputIndexes": +[ 2058 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2057 ] +, "main_type": "NONE", "name": "Rank3033", "outputIndexes": +[ 2059 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2059, 2059 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3035", "outputIndexes": +[ 2060 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2060 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3036", "outputIndexes": +[ 2061 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2060, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3038", "outputIndexes": +[ 2062 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2062 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3039", "outputIndexes": +[ 2063 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2058, 2061, 2063, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3042", "outputIndexes": +[ 2064 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2064 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3043", "outputIndexes": +[ 2065 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2065 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3044", "outputIndexes": +[ 2066 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2066, 2065 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3045", "outputIndexes": +[ 2067 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2057, 2067, 2060 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.22/self_attn/Gather_3_output_0", "outputIndexes": +[ 2068 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2068, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Div_1_output_0", "outputIndexes": +[ 2069 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2069, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2070 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2055, 2070, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.22/self_attn/Slice_3_output_0", "outputIndexes": +[ 2071 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2071 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.22/self_attn/Neg_1_output_0", "outputIndexes": +[ 2072 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2069, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2073 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2055, 20, 2073, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.22/self_attn/Slice_2_output_0", "outputIndexes": +[ 2074 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2072, 2074 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.22/self_attn/Concat_4_output_0", "outputIndexes": +[ 2075 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2075, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Mul_3_output_0", "outputIndexes": +[ 2076 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2056, 2076 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Add_1_output_0", "outputIndexes": +[ 2077 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3514 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2712309096, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.22/self_attn/v_proj/Linear", "outputIndexes": +[ 3523 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3523 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3524 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3524 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2078 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2017, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2079 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2025, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2080 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2079, 2080, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.22/self_attn/Concat_2_output_0", "outputIndexes": +[ 2081 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2078, 2081 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.22/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2082 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2050, 2077, 2082, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.22/self_attn/FusedAttention", "outputIndexes": +[ 2083 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2083 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3525 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3525 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.22/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3526 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3526 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2714668414, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.22/self_attn/o_proj/Linear", "outputIndexes": +[ 3527 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3527 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3528 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3528 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2084 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2004, 2084 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/Add_output_0", "outputIndexes": +[ 2085 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2085 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2724105620, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.22/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2086 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2086 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.22/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3529 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3529 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.22/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3530 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3530 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2724138388, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.22/mlp/gate_proj/Linear", "outputIndexes": +[ 3531 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3531 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3532 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3532 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.22/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2087 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2087 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.22/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2088 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3530 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2757168554, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.22/mlp/up_proj/Linear", "outputIndexes": +[ 3535 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3535 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3536 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3536 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.22/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2089 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2088, 2089 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/mlp/Mul_output_0", "outputIndexes": +[ 2090 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2090 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.22/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3537 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3537 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.22/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3538 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3538 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2790198720, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.22/mlp/down_proj/Linear", "outputIndexes": +[ 3539 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3539 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3540 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3540 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.22/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2091 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2085, 2091 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/Add_1_output_0", "outputIndexes": +[ 2092 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2092, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.23/Reshape_output_0", "outputIndexes": +[ 2093 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2093 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2823228886, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.23/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2094 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2094 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3541 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3541 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.23/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3542 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3542 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2823261654, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.23/self_attn/q_proj/Linear", "outputIndexes": +[ 3543 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3543 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3544 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3544 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2095 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2094 ] +, "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_output_0", "outputIndexes": +[ 2096 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2096 ] +, "main_type": "NONE", "name": "Shape3091", "outputIndexes": +[ 2097 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2096 ] +, "main_type": "NONE", "name": "Rank3093", "outputIndexes": +[ 2098 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2098, 2098 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3095", "outputIndexes": +[ 2099 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2099 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3096", "outputIndexes": +[ 2100 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2099, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3098", "outputIndexes": +[ 2101 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2101 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3099", "outputIndexes": +[ 2102 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2097, 2100, 2102, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3102", "outputIndexes": +[ 2103 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2103 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3103", "outputIndexes": +[ 2104 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2104, 2104 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3105", "outputIndexes": +[ 2105 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2096, 2105, 2099 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.23/self_attn/Gather_output_0", "outputIndexes": +[ 2106 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2106, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2107 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2099 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3113", "outputIndexes": +[ 2108 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2101 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3116", "outputIndexes": +[ 2109 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2097, 2108, 2109, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3119", "outputIndexes": +[ 2110 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2110 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3120", "outputIndexes": +[ 2111 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 2111 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3121", "outputIndexes": +[ 2112 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2112, 2111 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3122", "outputIndexes": +[ 2113 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2096, 2113, 2099 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.23/self_attn/Gather_1_output_0", "outputIndexes": +[ 2114 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2114, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2115 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2107, 2115, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.23/self_attn/Concat_output_0", "outputIndexes": +[ 2116 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2095, 2116 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.23/self_attn/Reshape_output_0", "outputIndexes": +[ 2117 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2117, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Mul_output_0", "outputIndexes": +[ 2118 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2117 ] +, "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_2_output_0", "outputIndexes": +[ 2119 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2119 ] +, "main_type": "NONE", "name": "Shape3129", "outputIndexes": +[ 2120 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2119 ] +, "main_type": "NONE", "name": "Rank3131", "outputIndexes": +[ 2121 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2121, 2121 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3133", "outputIndexes": +[ 2122 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2122 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3134", "outputIndexes": +[ 2123 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2122, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3136", "outputIndexes": +[ 2124 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2124 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3137", "outputIndexes": +[ 2125 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2120, 2123, 2125, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3140", "outputIndexes": +[ 2126 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2126 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3141", "outputIndexes": +[ 2127 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2127 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3142", "outputIndexes": +[ 2128 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2128, 2127 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3143", "outputIndexes": +[ 2129 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2119, 2129, 2122 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.23/self_attn/Gather_2_output_0", "outputIndexes": +[ 2130 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2130, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Div_output_0", "outputIndexes": +[ 2131 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2131, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2132 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2117, 2132, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.23/self_attn/Slice_1_output_0", "outputIndexes": +[ 2133 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2133 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.23/self_attn/Neg_output_0", "outputIndexes": +[ 2134 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2131, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2135 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2117, 20, 2135, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.23/self_attn/Slice_output_0", "outputIndexes": +[ 2136 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2134, 2136 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.23/self_attn/Concat_3_output_0", "outputIndexes": +[ 2137 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2137, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Mul_1_output_0", "outputIndexes": +[ 2138 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2118, 2138 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Add_output_0", "outputIndexes": +[ 2139 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3542 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2832698860, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.23/self_attn/k_proj/Linear", "outputIndexes": +[ 3547 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3547 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3548 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3548 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2140 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2106, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2141 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2114, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2142 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2141, 2142, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.23/self_attn/Concat_1_output_0", "outputIndexes": +[ 2143 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2140, 2143 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.23/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2144 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2144, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Mul_2_output_0", "outputIndexes": +[ 2145 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2144 ] +, "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_3_output_0", "outputIndexes": +[ 2146 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2146 ] +, "main_type": "NONE", "name": "Shape3162", "outputIndexes": +[ 2147 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2146 ] +, "main_type": "NONE", "name": "Rank3164", "outputIndexes": +[ 2148 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2148, 2148 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3166", "outputIndexes": +[ 2149 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2149 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3167", "outputIndexes": +[ 2150 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2149, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3169", "outputIndexes": +[ 2151 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2151 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3170", "outputIndexes": +[ 2152 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2147, 2150, 2152, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3173", "outputIndexes": +[ 2153 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2153 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3174", "outputIndexes": +[ 2154 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2154 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3175", "outputIndexes": +[ 2155 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2155, 2154 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3176", "outputIndexes": +[ 2156 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2146, 2156, 2149 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.23/self_attn/Gather_3_output_0", "outputIndexes": +[ 2157 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2157, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Div_1_output_0", "outputIndexes": +[ 2158 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2158, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2159 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2144, 2159, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.23/self_attn/Slice_3_output_0", "outputIndexes": +[ 2160 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2160 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.23/self_attn/Neg_1_output_0", "outputIndexes": +[ 2161 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2158, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2162 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2144, 20, 2162, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.23/self_attn/Slice_2_output_0", "outputIndexes": +[ 2163 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2161, 2163 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.23/self_attn/Concat_4_output_0", "outputIndexes": +[ 2164 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2164, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Mul_3_output_0", "outputIndexes": +[ 2165 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2145, 2165 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Add_1_output_0", "outputIndexes": +[ 2166 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3542 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2835058178, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.23/self_attn/v_proj/Linear", "outputIndexes": +[ 3551 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3551 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3552 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3552 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2167 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2106, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2168 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2114, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2169 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2168, 2169, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.23/self_attn/Concat_2_output_0", "outputIndexes": +[ 2170 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2167, 2170 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.23/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2171 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2139, 2166, 2171, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.23/self_attn/FusedAttention", "outputIndexes": +[ 2172 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2172 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3553 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3553 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.23/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3554 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3554 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2837417496, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.23/self_attn/o_proj/Linear", "outputIndexes": +[ 3555 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3555 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3556 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3556 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2173 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2093, 2173 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/Add_output_0", "outputIndexes": +[ 2174 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2174 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2846854702, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.23/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2175 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2175 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.23/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3557 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3557 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.23/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3558 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3558 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2846887470, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.23/mlp/gate_proj/Linear", "outputIndexes": +[ 3559 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3559 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3560 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3560 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.23/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2176 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2176 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.23/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2177 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3558 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2879917636, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.23/mlp/up_proj/Linear", "outputIndexes": +[ 3563 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3563 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3564 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3564 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.23/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2178 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2177, 2178 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/mlp/Mul_output_0", "outputIndexes": +[ 2179 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2179 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.23/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3565 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3565 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.23/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3566 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3566 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2912947802, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.23/mlp/down_proj/Linear", "outputIndexes": +[ 3567 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3567 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3568 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3568 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.23/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2180 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2174, 2180 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/Add_1_output_0", "outputIndexes": +[ 2181 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2181, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.24/Reshape_output_0", "outputIndexes": +[ 2182 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2182 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2945977968, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.24/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2183 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2183 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3569 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3569 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.24/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3570 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3570 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2946010736, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.24/self_attn/q_proj/Linear", "outputIndexes": +[ 3571 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3571 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3572 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3572 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2184 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2183 ] +, "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_output_0", "outputIndexes": +[ 2185 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2185 ] +, "main_type": "NONE", "name": "Shape3222", "outputIndexes": +[ 2186 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2185 ] +, "main_type": "NONE", "name": "Rank3224", "outputIndexes": +[ 2187 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2187, 2187 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3226", "outputIndexes": +[ 2188 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2188 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3227", "outputIndexes": +[ 2189 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2188, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3229", "outputIndexes": +[ 2190 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2190 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3230", "outputIndexes": +[ 2191 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2186, 2189, 2191, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3233", "outputIndexes": +[ 2192 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2192 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3234", "outputIndexes": +[ 2193 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2193, 2193 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3236", "outputIndexes": +[ 2194 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2185, 2194, 2188 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.24/self_attn/Gather_output_0", "outputIndexes": +[ 2195 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2195, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2196 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2188 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3244", "outputIndexes": +[ 2197 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2190 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3247", "outputIndexes": +[ 2198 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2186, 2197, 2198, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3250", "outputIndexes": +[ 2199 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2199 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3251", "outputIndexes": +[ 2200 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 2200 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3252", "outputIndexes": +[ 2201 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2201, 2200 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3253", "outputIndexes": +[ 2202 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2185, 2202, 2188 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.24/self_attn/Gather_1_output_0", "outputIndexes": +[ 2203 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2203, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2204 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2196, 2204, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.24/self_attn/Concat_output_0", "outputIndexes": +[ 2205 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2184, 2205 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.24/self_attn/Reshape_output_0", "outputIndexes": +[ 2206 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2206, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Mul_output_0", "outputIndexes": +[ 2207 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2206 ] +, "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_2_output_0", "outputIndexes": +[ 2208 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2208 ] +, "main_type": "NONE", "name": "Shape3260", "outputIndexes": +[ 2209 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2208 ] +, "main_type": "NONE", "name": "Rank3262", "outputIndexes": +[ 2210 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2210, 2210 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3264", "outputIndexes": +[ 2211 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2211 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3265", "outputIndexes": +[ 2212 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2211, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3267", "outputIndexes": +[ 2213 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2213 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3268", "outputIndexes": +[ 2214 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2209, 2212, 2214, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3271", "outputIndexes": +[ 2215 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2215 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3272", "outputIndexes": +[ 2216 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2216 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3273", "outputIndexes": +[ 2217 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2217, 2216 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3274", "outputIndexes": +[ 2218 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2208, 2218, 2211 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.24/self_attn/Gather_2_output_0", "outputIndexes": +[ 2219 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2219, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Div_output_0", "outputIndexes": +[ 2220 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2220, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2221 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2206, 2221, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.24/self_attn/Slice_1_output_0", "outputIndexes": +[ 2222 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2222 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.24/self_attn/Neg_output_0", "outputIndexes": +[ 2223 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2220, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2224 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2206, 20, 2224, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.24/self_attn/Slice_output_0", "outputIndexes": +[ 2225 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2223, 2225 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.24/self_attn/Concat_3_output_0", "outputIndexes": +[ 2226 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2226, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Mul_1_output_0", "outputIndexes": +[ 2227 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2207, 2227 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Add_output_0", "outputIndexes": +[ 2228 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3570 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2955447942, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.24/self_attn/k_proj/Linear", "outputIndexes": +[ 3575 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3575 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3576 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3576 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2229 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2195, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2230 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2203, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2231 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2230, 2231, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.24/self_attn/Concat_1_output_0", "outputIndexes": +[ 2232 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2229, 2232 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.24/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2233 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2233, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Mul_2_output_0", "outputIndexes": +[ 2234 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2233 ] +, "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_3_output_0", "outputIndexes": +[ 2235 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2235 ] +, "main_type": "NONE", "name": "Shape3293", "outputIndexes": +[ 2236 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2235 ] +, "main_type": "NONE", "name": "Rank3295", "outputIndexes": +[ 2237 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2237, 2237 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3297", "outputIndexes": +[ 2238 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2238 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3298", "outputIndexes": +[ 2239 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2238, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3300", "outputIndexes": +[ 2240 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2240 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3301", "outputIndexes": +[ 2241 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2236, 2239, 2241, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3304", "outputIndexes": +[ 2242 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2242 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3305", "outputIndexes": +[ 2243 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2243 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3306", "outputIndexes": +[ 2244 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2244, 2243 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3307", "outputIndexes": +[ 2245 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2235, 2245, 2238 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.24/self_attn/Gather_3_output_0", "outputIndexes": +[ 2246 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2246, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Div_1_output_0", "outputIndexes": +[ 2247 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2247, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2248 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2233, 2248, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.24/self_attn/Slice_3_output_0", "outputIndexes": +[ 2249 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2249 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.24/self_attn/Neg_1_output_0", "outputIndexes": +[ 2250 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2247, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2251 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2233, 20, 2251, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.24/self_attn/Slice_2_output_0", "outputIndexes": +[ 2252 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2250, 2252 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.24/self_attn/Concat_4_output_0", "outputIndexes": +[ 2253 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2253, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Mul_3_output_0", "outputIndexes": +[ 2254 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2234, 2254 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Add_1_output_0", "outputIndexes": +[ 2255 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3570 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2957807260, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.24/self_attn/v_proj/Linear", "outputIndexes": +[ 3579 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3579 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3580 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3580 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2256 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2195, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2257 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2203, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2258 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2257, 2258, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.24/self_attn/Concat_2_output_0", "outputIndexes": +[ 2259 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2256, 2259 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.24/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2260 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2228, 2255, 2260, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.24/self_attn/FusedAttention", "outputIndexes": +[ 2261 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2261 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3581 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3581 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.24/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3582 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3582 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2960166578, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.24/self_attn/o_proj/Linear", "outputIndexes": +[ 3583 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3583 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3584 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3584 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2262 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2182, 2262 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/Add_output_0", "outputIndexes": +[ 2263 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2263 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 2969603784, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.24/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2264 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2264 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.24/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3585 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3585 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.24/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3586 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3586 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 2969636552, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.24/mlp/gate_proj/Linear", "outputIndexes": +[ 3587 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3587 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3588 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3588 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.24/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2265 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2265 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.24/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2266 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3586 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3002666718, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.24/mlp/up_proj/Linear", "outputIndexes": +[ 3591 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3591 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3592 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3592 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.24/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2267 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2266, 2267 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/mlp/Mul_output_0", "outputIndexes": +[ 2268 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2268 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.24/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3593 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3593 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.24/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3594 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3594 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3035696884, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.24/mlp/down_proj/Linear", "outputIndexes": +[ 3595 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3595 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3596 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3596 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.24/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2269 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2263, 2269 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/Add_1_output_0", "outputIndexes": +[ 2270 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2270, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.25/Reshape_output_0", "outputIndexes": +[ 2271 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2271 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3068727050, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.25/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2272 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2272 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3597 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3597 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.25/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3598 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3598 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3068759818, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.25/self_attn/q_proj/Linear", "outputIndexes": +[ 3599 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3599 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3600 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3600 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2273 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2272 ] +, "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_output_0", "outputIndexes": +[ 2274 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2274 ] +, "main_type": "NONE", "name": "Shape3353", "outputIndexes": +[ 2275 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2274 ] +, "main_type": "NONE", "name": "Rank3355", "outputIndexes": +[ 2276 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2276, 2276 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3357", "outputIndexes": +[ 2277 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2277 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3358", "outputIndexes": +[ 2278 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2277, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3360", "outputIndexes": +[ 2279 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2279 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3361", "outputIndexes": +[ 2280 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2275, 2278, 2280, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3364", "outputIndexes": +[ 2281 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2281 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3365", "outputIndexes": +[ 2282 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2282, 2282 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3367", "outputIndexes": +[ 2283 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2274, 2283, 2277 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.25/self_attn/Gather_output_0", "outputIndexes": +[ 2284 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2284, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2285 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2277 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3375", "outputIndexes": +[ 2286 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2279 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3378", "outputIndexes": +[ 2287 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2275, 2286, 2287, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3381", "outputIndexes": +[ 2288 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2288 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3382", "outputIndexes": +[ 2289 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 2289 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3383", "outputIndexes": +[ 2290 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2290, 2289 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3384", "outputIndexes": +[ 2291 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2274, 2291, 2277 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.25/self_attn/Gather_1_output_0", "outputIndexes": +[ 2292 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2292, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2293 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2285, 2293, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.25/self_attn/Concat_output_0", "outputIndexes": +[ 2294 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2273, 2294 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.25/self_attn/Reshape_output_0", "outputIndexes": +[ 2295 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2295, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Mul_output_0", "outputIndexes": +[ 2296 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2295 ] +, "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_2_output_0", "outputIndexes": +[ 2297 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2297 ] +, "main_type": "NONE", "name": "Shape3391", "outputIndexes": +[ 2298 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2297 ] +, "main_type": "NONE", "name": "Rank3393", "outputIndexes": +[ 2299 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2299, 2299 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3395", "outputIndexes": +[ 2300 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2300 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3396", "outputIndexes": +[ 2301 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2300, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3398", "outputIndexes": +[ 2302 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2302 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3399", "outputIndexes": +[ 2303 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2298, 2301, 2303, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3402", "outputIndexes": +[ 2304 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2304 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3403", "outputIndexes": +[ 2305 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2305 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3404", "outputIndexes": +[ 2306 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2306, 2305 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3405", "outputIndexes": +[ 2307 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2297, 2307, 2300 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.25/self_attn/Gather_2_output_0", "outputIndexes": +[ 2308 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2308, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Div_output_0", "outputIndexes": +[ 2309 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2309, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2310 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2295, 2310, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.25/self_attn/Slice_1_output_0", "outputIndexes": +[ 2311 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2311 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.25/self_attn/Neg_output_0", "outputIndexes": +[ 2312 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2309, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2313 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2295, 20, 2313, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.25/self_attn/Slice_output_0", "outputIndexes": +[ 2314 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2312, 2314 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.25/self_attn/Concat_3_output_0", "outputIndexes": +[ 2315 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2315, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Mul_1_output_0", "outputIndexes": +[ 2316 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2296, 2316 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Add_output_0", "outputIndexes": +[ 2317 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3598 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3078197024, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.25/self_attn/k_proj/Linear", "outputIndexes": +[ 3603 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3603 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3604 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3604 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2318 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2284, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2319 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2292, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2320 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2319, 2320, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.25/self_attn/Concat_1_output_0", "outputIndexes": +[ 2321 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2318, 2321 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.25/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2322 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2322, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Mul_2_output_0", "outputIndexes": +[ 2323 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2322 ] +, "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_3_output_0", "outputIndexes": +[ 2324 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2324 ] +, "main_type": "NONE", "name": "Shape3424", "outputIndexes": +[ 2325 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2324 ] +, "main_type": "NONE", "name": "Rank3426", "outputIndexes": +[ 2326 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2326, 2326 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3428", "outputIndexes": +[ 2327 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2327 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3429", "outputIndexes": +[ 2328 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2327, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3431", "outputIndexes": +[ 2329 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2329 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3432", "outputIndexes": +[ 2330 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2325, 2328, 2330, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3435", "outputIndexes": +[ 2331 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2331 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3436", "outputIndexes": +[ 2332 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2332 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3437", "outputIndexes": +[ 2333 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2333, 2332 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3438", "outputIndexes": +[ 2334 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2324, 2334, 2327 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.25/self_attn/Gather_3_output_0", "outputIndexes": +[ 2335 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2335, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Div_1_output_0", "outputIndexes": +[ 2336 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2336, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2337 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2322, 2337, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.25/self_attn/Slice_3_output_0", "outputIndexes": +[ 2338 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2338 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.25/self_attn/Neg_1_output_0", "outputIndexes": +[ 2339 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2336, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2340 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2322, 20, 2340, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.25/self_attn/Slice_2_output_0", "outputIndexes": +[ 2341 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2339, 2341 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.25/self_attn/Concat_4_output_0", "outputIndexes": +[ 2342 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2342, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Mul_3_output_0", "outputIndexes": +[ 2343 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2323, 2343 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Add_1_output_0", "outputIndexes": +[ 2344 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3598 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3080556342, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.25/self_attn/v_proj/Linear", "outputIndexes": +[ 3607 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3607 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3608 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3608 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2345 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2284, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2346 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2292, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2347 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2346, 2347, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.25/self_attn/Concat_2_output_0", "outputIndexes": +[ 2348 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2345, 2348 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.25/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2349 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2317, 2344, 2349, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.25/self_attn/FusedAttention", "outputIndexes": +[ 2350 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2350 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3609 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3609 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.25/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3610 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3610 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3082915660, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.25/self_attn/o_proj/Linear", "outputIndexes": +[ 3611 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3611 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3612 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3612 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2351 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2271, 2351 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/Add_output_0", "outputIndexes": +[ 2352 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2352 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3092352866, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.25/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2353 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2353 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.25/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3613 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3613 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.25/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3614 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3614 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3092385634, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.25/mlp/gate_proj/Linear", "outputIndexes": +[ 3615 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3615 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3616 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3616 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.25/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2354 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2354 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.25/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2355 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3614 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3125415800, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.25/mlp/up_proj/Linear", "outputIndexes": +[ 3619 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3619 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3620 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3620 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.25/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2356 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2355, 2356 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/mlp/Mul_output_0", "outputIndexes": +[ 2357 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2357 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.25/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3621 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3621 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.25/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3622 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3622 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3158445966, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.25/mlp/down_proj/Linear", "outputIndexes": +[ 3623 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3623 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3624 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3624 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.25/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2358 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2352, 2358 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/Add_1_output_0", "outputIndexes": +[ 2359 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2359, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.26/Reshape_output_0", "outputIndexes": +[ 2360 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2360 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3191476132, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.26/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2361 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2361 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.26/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3625 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3625 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.26/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3626 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3626 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3191508900, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.26/self_attn/q_proj/Linear", "outputIndexes": +[ 3627 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3627 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.26/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3628 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3628 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.26/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2362 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2361 ] +, "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_output_0", "outputIndexes": +[ 2363 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2363 ] +, "main_type": "NONE", "name": "Shape3484", "outputIndexes": +[ 2364 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2363 ] +, "main_type": "NONE", "name": "Rank3486", "outputIndexes": +[ 2365 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2365, 2365 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3488", "outputIndexes": +[ 2366 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2366 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3489", "outputIndexes": +[ 2367 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2366, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3491", "outputIndexes": +[ 2368 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2368 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3492", "outputIndexes": +[ 2369 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2364, 2367, 2369, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3495", "outputIndexes": +[ 2370 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2370 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3496", "outputIndexes": +[ 2371 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2371, 2371 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3498", "outputIndexes": +[ 2372 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2363, 2372, 2366 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.26/self_attn/Gather_output_0", "outputIndexes": +[ 2373 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2373, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.26/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2374 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2366 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3506", "outputIndexes": +[ 2375 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2368 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3509", "outputIndexes": +[ 2376 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2364, 2375, 2376, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3512", "outputIndexes": +[ 2377 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2377 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3513", "outputIndexes": +[ 2378 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 2378 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3514", "outputIndexes": +[ 2379 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2379, 2378 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3515", "outputIndexes": +[ 2380 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2363, 2380, 2366 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.26/self_attn/Gather_1_output_0", "outputIndexes": +[ 2381 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2381, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.26/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2382 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2374, 2382, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.26/self_attn/Concat_output_0", "outputIndexes": +[ 2383 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2362, 2383 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.26/self_attn/Reshape_output_0", "outputIndexes": +[ 2384 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2384, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/self_attn/Mul_output_0", "outputIndexes": +[ 2385 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2384 ] +, "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_2_output_0", "outputIndexes": +[ 2386 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2386 ] +, "main_type": "NONE", "name": "Shape3522", "outputIndexes": +[ 2387 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2386 ] +, "main_type": "NONE", "name": "Rank3524", "outputIndexes": +[ 2388 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2388, 2388 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3526", "outputIndexes": +[ 2389 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2389 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3527", "outputIndexes": +[ 2390 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2389, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3529", "outputIndexes": +[ 2391 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2391 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3530", "outputIndexes": +[ 2392 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2387, 2390, 2392, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3533", "outputIndexes": +[ 2393 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2393 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3534", "outputIndexes": +[ 2394 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2394 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3535", "outputIndexes": +[ 2395 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2395, 2394 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3536", "outputIndexes": +[ 2396 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2386, 2396, 2389 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.26/self_attn/Gather_2_output_0", "outputIndexes": +[ 2397 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2397, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/self_attn/Div_output_0", "outputIndexes": +[ 2398 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2398, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.26/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2399 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2384, 2399, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.26/self_attn/Slice_1_output_0", "outputIndexes": +[ 2400 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2400 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.26/self_attn/Neg_output_0", "outputIndexes": +[ 2401 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2398, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.26/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2402 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2384, 20, 2402, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.26/self_attn/Slice_output_0", "outputIndexes": +[ 2403 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2401, 2403 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.26/self_attn/Concat_3_output_0", "outputIndexes": +[ 2404 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2404, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/self_attn/Mul_1_output_0", "outputIndexes": +[ 2405 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2385, 2405 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/self_attn/Add_output_0", "outputIndexes": +[ 2406 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3626 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3200946106, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.26/self_attn/k_proj/Linear", "outputIndexes": +[ 3631 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3631 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.26/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3632 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3632 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.26/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2407 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2373, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.26/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2408 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2381, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.26/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2409 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2408, 2409, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.26/self_attn/Concat_1_output_0", "outputIndexes": +[ 2410 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2407, 2410 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.26/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2411 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2411, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/self_attn/Mul_2_output_0", "outputIndexes": +[ 2412 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2411 ] +, "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_3_output_0", "outputIndexes": +[ 2413 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2413 ] +, "main_type": "NONE", "name": "Shape3555", "outputIndexes": +[ 2414 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2413 ] +, "main_type": "NONE", "name": "Rank3557", "outputIndexes": +[ 2415 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2415, 2415 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3559", "outputIndexes": +[ 2416 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2416 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3560", "outputIndexes": +[ 2417 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2416, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3562", "outputIndexes": +[ 2418 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2418 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3563", "outputIndexes": +[ 2419 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2414, 2417, 2419, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3566", "outputIndexes": +[ 2420 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2420 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3567", "outputIndexes": +[ 2421 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2421 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3568", "outputIndexes": +[ 2422 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2422, 2421 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3569", "outputIndexes": +[ 2423 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2413, 2423, 2416 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.26/self_attn/Gather_3_output_0", "outputIndexes": +[ 2424 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2424, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/self_attn/Div_1_output_0", "outputIndexes": +[ 2425 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2425, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.26/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2426 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2411, 2426, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.26/self_attn/Slice_3_output_0", "outputIndexes": +[ 2427 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2427 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.26/self_attn/Neg_1_output_0", "outputIndexes": +[ 2428 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2425, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.26/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2429 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2411, 20, 2429, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.26/self_attn/Slice_2_output_0", "outputIndexes": +[ 2430 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2428, 2430 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.26/self_attn/Concat_4_output_0", "outputIndexes": +[ 2431 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2431, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/self_attn/Mul_3_output_0", "outputIndexes": +[ 2432 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2412, 2432 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/self_attn/Add_1_output_0", "outputIndexes": +[ 2433 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3626 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3203305424, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.26/self_attn/v_proj/Linear", "outputIndexes": +[ 3635 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3635 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.26/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3636 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3636 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.26/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2434 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2373, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.26/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2435 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2381, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.26/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2436 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2435, 2436, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.26/self_attn/Concat_2_output_0", "outputIndexes": +[ 2437 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2434, 2437 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.26/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2438 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2406, 2433, 2438, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.26/self_attn/FusedAttention", "outputIndexes": +[ 2439 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2439 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.26/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3637 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3637 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.26/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3638 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3638 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3205664742, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.26/self_attn/o_proj/Linear", "outputIndexes": +[ 3639 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3639 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.26/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3640 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3640 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.26/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2440 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2360, 2440 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/Add_output_0", "outputIndexes": +[ 2441 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2441 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3215101948, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.26/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2442 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2442 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.26/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3641 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3641 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.26/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3642 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3642 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3215134716, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.26/mlp/gate_proj/Linear", "outputIndexes": +[ 3643 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3643 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.26/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3644 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3644 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.26/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2443 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2443 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.26/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2444 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3642 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3248164882, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.26/mlp/up_proj/Linear", "outputIndexes": +[ 3647 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3647 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.26/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3648 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3648 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.26/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2445 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2444, 2445 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/mlp/Mul_output_0", "outputIndexes": +[ 2446 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2446 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.26/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3649 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3649 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.26/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3650 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3650 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3281195048, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.26/mlp/down_proj/Linear", "outputIndexes": +[ 3651 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3651 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.26/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3652 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3652 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.26/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2447 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2441, 2447 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.26/Add_1_output_0", "outputIndexes": +[ 2448 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2448, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.27/Reshape_output_0", "outputIndexes": +[ 2449 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2449 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3314225214, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.27/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2450 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2450 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.27/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3653 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3653 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.27/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3654 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3654 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3314257982, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.27/self_attn/q_proj/Linear", "outputIndexes": +[ 3655 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3655 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.27/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3656 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3656 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.27/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2451 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2450 ] +, "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_output_0", "outputIndexes": +[ 2452 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2452 ] +, "main_type": "NONE", "name": "Shape3615", "outputIndexes": +[ 2453 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2452 ] +, "main_type": "NONE", "name": "Rank3617", "outputIndexes": +[ 2454 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2454, 2454 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3619", "outputIndexes": +[ 2455 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2455 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3620", "outputIndexes": +[ 2456 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2455, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3622", "outputIndexes": +[ 2457 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2457 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3623", "outputIndexes": +[ 2458 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2453, 2456, 2458, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3626", "outputIndexes": +[ 2459 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2459 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3627", "outputIndexes": +[ 2460 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2460, 2460 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3629", "outputIndexes": +[ 2461 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2452, 2461, 2455 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.27/self_attn/Gather_output_0", "outputIndexes": +[ 2462 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2462, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.27/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2463 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2455 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3637", "outputIndexes": +[ 2464 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2457 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3640", "outputIndexes": +[ 2465 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2453, 2464, 2465, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3643", "outputIndexes": +[ 2466 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2466 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3644", "outputIndexes": +[ 2467 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 2467 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3645", "outputIndexes": +[ 2468 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2468, 2467 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3646", "outputIndexes": +[ 2469 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2452, 2469, 2455 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.27/self_attn/Gather_1_output_0", "outputIndexes": +[ 2470 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2470, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.27/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2471 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2463, 2471, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.27/self_attn/Concat_output_0", "outputIndexes": +[ 2472 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2451, 2472 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.27/self_attn/Reshape_output_0", "outputIndexes": +[ 2473 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2473, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/self_attn/Mul_output_0", "outputIndexes": +[ 2474 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2473 ] +, "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_2_output_0", "outputIndexes": +[ 2475 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2475 ] +, "main_type": "NONE", "name": "Shape3653", "outputIndexes": +[ 2476 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2475 ] +, "main_type": "NONE", "name": "Rank3655", "outputIndexes": +[ 2477 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2477, 2477 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3657", "outputIndexes": +[ 2478 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2478 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3658", "outputIndexes": +[ 2479 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2478, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3660", "outputIndexes": +[ 2480 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2480 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3661", "outputIndexes": +[ 2481 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2476, 2479, 2481, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3664", "outputIndexes": +[ 2482 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2482 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3665", "outputIndexes": +[ 2483 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2483 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3666", "outputIndexes": +[ 2484 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2484, 2483 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3667", "outputIndexes": +[ 2485 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2475, 2485, 2478 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.27/self_attn/Gather_2_output_0", "outputIndexes": +[ 2486 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2486, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/self_attn/Div_output_0", "outputIndexes": +[ 2487 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2487, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.27/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2488 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2473, 2488, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.27/self_attn/Slice_1_output_0", "outputIndexes": +[ 2489 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2489 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.27/self_attn/Neg_output_0", "outputIndexes": +[ 2490 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2487, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.27/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2491 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2473, 20, 2491, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.27/self_attn/Slice_output_0", "outputIndexes": +[ 2492 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2490, 2492 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.27/self_attn/Concat_3_output_0", "outputIndexes": +[ 2493 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2493, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/self_attn/Mul_1_output_0", "outputIndexes": +[ 2494 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2474, 2494 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/self_attn/Add_output_0", "outputIndexes": +[ 2495 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3654 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3323695188, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.27/self_attn/k_proj/Linear", "outputIndexes": +[ 3659 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3659 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.27/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3660 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3660 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.27/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2496 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2462, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.27/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2497 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2470, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.27/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2498 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2497, 2498, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.27/self_attn/Concat_1_output_0", "outputIndexes": +[ 2499 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2496, 2499 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.27/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2500 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2500, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/self_attn/Mul_2_output_0", "outputIndexes": +[ 2501 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2500 ] +, "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_3_output_0", "outputIndexes": +[ 2502 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2502 ] +, "main_type": "NONE", "name": "Shape3686", "outputIndexes": +[ 2503 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2502 ] +, "main_type": "NONE", "name": "Rank3688", "outputIndexes": +[ 2504 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2504, 2504 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3690", "outputIndexes": +[ 2505 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2505 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3691", "outputIndexes": +[ 2506 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2505, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3693", "outputIndexes": +[ 2507 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2507 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3694", "outputIndexes": +[ 2508 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2503, 2506, 2508, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3697", "outputIndexes": +[ 2509 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2509 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3698", "outputIndexes": +[ 2510 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2510 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3699", "outputIndexes": +[ 2511 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2511, 2510 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3700", "outputIndexes": +[ 2512 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2502, 2512, 2505 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.27/self_attn/Gather_3_output_0", "outputIndexes": +[ 2513 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2513, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/self_attn/Div_1_output_0", "outputIndexes": +[ 2514 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2514, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.27/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2515 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2500, 2515, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.27/self_attn/Slice_3_output_0", "outputIndexes": +[ 2516 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2516 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.27/self_attn/Neg_1_output_0", "outputIndexes": +[ 2517 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2514, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.27/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2518 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2500, 20, 2518, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.27/self_attn/Slice_2_output_0", "outputIndexes": +[ 2519 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2517, 2519 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.27/self_attn/Concat_4_output_0", "outputIndexes": +[ 2520 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2520, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/self_attn/Mul_3_output_0", "outputIndexes": +[ 2521 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2501, 2521 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/self_attn/Add_1_output_0", "outputIndexes": +[ 2522 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3654 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3326054506, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.27/self_attn/v_proj/Linear", "outputIndexes": +[ 3663 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3663 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.27/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3664 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3664 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.27/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2523 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2462, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.27/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2524 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2470, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.27/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2525 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2524, 2525, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.27/self_attn/Concat_2_output_0", "outputIndexes": +[ 2526 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2523, 2526 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.27/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2527 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2495, 2522, 2527, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.27/self_attn/FusedAttention", "outputIndexes": +[ 2528 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2528 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.27/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3665 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3665 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.27/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3666 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3666 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3328413824, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.27/self_attn/o_proj/Linear", "outputIndexes": +[ 3667 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3667 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.27/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3668 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3668 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.27/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2529 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2449, 2529 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/Add_output_0", "outputIndexes": +[ 2530 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2530 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3337851030, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.27/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2531 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2531 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.27/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3669 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3669 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.27/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3670 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3670 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3337883798, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.27/mlp/gate_proj/Linear", "outputIndexes": +[ 3671 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3671 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.27/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3672 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3672 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.27/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2532 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2532 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.27/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2533 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3670 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3370913964, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.27/mlp/up_proj/Linear", "outputIndexes": +[ 3675 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3675 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.27/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3676 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3676 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.27/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2534 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2533, 2534 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/mlp/Mul_output_0", "outputIndexes": +[ 2535 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2535 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.27/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3677 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3677 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.27/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3678 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3678 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3403944130, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.27/mlp/down_proj/Linear", "outputIndexes": +[ 3679 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3679 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.27/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3680 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3680 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.27/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2536 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2530, 2536 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.27/Add_1_output_0", "outputIndexes": +[ 2537 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2537, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.28/Reshape_output_0", "outputIndexes": +[ 2538 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2538 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3436974296, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.28/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2539 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2539 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.28/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3681 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3681 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.28/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3682 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3682 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3437007064, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.28/self_attn/q_proj/Linear", "outputIndexes": +[ 3683 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3683 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.28/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3684 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3684 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.28/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2540 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2539 ] +, "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_output_0", "outputIndexes": +[ 2541 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2541 ] +, "main_type": "NONE", "name": "Shape3746", "outputIndexes": +[ 2542 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2541 ] +, "main_type": "NONE", "name": "Rank3748", "outputIndexes": +[ 2543 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2543, 2543 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3750", "outputIndexes": +[ 2544 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2544 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3751", "outputIndexes": +[ 2545 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2544, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3753", "outputIndexes": +[ 2546 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2546 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3754", "outputIndexes": +[ 2547 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2542, 2545, 2547, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3757", "outputIndexes": +[ 2548 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2548 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3758", "outputIndexes": +[ 2549 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2549, 2549 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3760", "outputIndexes": +[ 2550 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2541, 2550, 2544 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.28/self_attn/Gather_output_0", "outputIndexes": +[ 2551 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2551, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.28/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2552 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2544 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3768", "outputIndexes": +[ 2553 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2546 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3771", "outputIndexes": +[ 2554 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2542, 2553, 2554, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3774", "outputIndexes": +[ 2555 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2555 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3775", "outputIndexes": +[ 2556 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 2556 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3776", "outputIndexes": +[ 2557 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2557, 2556 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3777", "outputIndexes": +[ 2558 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2541, 2558, 2544 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.28/self_attn/Gather_1_output_0", "outputIndexes": +[ 2559 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2559, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.28/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2560 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2552, 2560, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.28/self_attn/Concat_output_0", "outputIndexes": +[ 2561 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2540, 2561 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.28/self_attn/Reshape_output_0", "outputIndexes": +[ 2562 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2562, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/self_attn/Mul_output_0", "outputIndexes": +[ 2563 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2562 ] +, "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_2_output_0", "outputIndexes": +[ 2564 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2564 ] +, "main_type": "NONE", "name": "Shape3784", "outputIndexes": +[ 2565 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2564 ] +, "main_type": "NONE", "name": "Rank3786", "outputIndexes": +[ 2566 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2566, 2566 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3788", "outputIndexes": +[ 2567 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2567 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3789", "outputIndexes": +[ 2568 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2567, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3791", "outputIndexes": +[ 2569 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2569 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3792", "outputIndexes": +[ 2570 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2565, 2568, 2570, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3795", "outputIndexes": +[ 2571 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2571 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3796", "outputIndexes": +[ 2572 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2572 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3797", "outputIndexes": +[ 2573 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2573, 2572 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3798", "outputIndexes": +[ 2574 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2564, 2574, 2567 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.28/self_attn/Gather_2_output_0", "outputIndexes": +[ 2575 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2575, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/self_attn/Div_output_0", "outputIndexes": +[ 2576 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2576, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.28/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2577 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2562, 2577, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.28/self_attn/Slice_1_output_0", "outputIndexes": +[ 2578 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2578 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.28/self_attn/Neg_output_0", "outputIndexes": +[ 2579 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2576, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.28/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2580 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2562, 20, 2580, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.28/self_attn/Slice_output_0", "outputIndexes": +[ 2581 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2579, 2581 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.28/self_attn/Concat_3_output_0", "outputIndexes": +[ 2582 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2582, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/self_attn/Mul_1_output_0", "outputIndexes": +[ 2583 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2563, 2583 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/self_attn/Add_output_0", "outputIndexes": +[ 2584 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3682 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3446444270, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.28/self_attn/k_proj/Linear", "outputIndexes": +[ 3687 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3687 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.28/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3688 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3688 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.28/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2585 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2551, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.28/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2586 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2559, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.28/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2587 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2586, 2587, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.28/self_attn/Concat_1_output_0", "outputIndexes": +[ 2588 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2585, 2588 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.28/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2589 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2589, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/self_attn/Mul_2_output_0", "outputIndexes": +[ 2590 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2589 ] +, "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_3_output_0", "outputIndexes": +[ 2591 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2591 ] +, "main_type": "NONE", "name": "Shape3817", "outputIndexes": +[ 2592 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2591 ] +, "main_type": "NONE", "name": "Rank3819", "outputIndexes": +[ 2593 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2593, 2593 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3821", "outputIndexes": +[ 2594 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2594 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3822", "outputIndexes": +[ 2595 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2594, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3824", "outputIndexes": +[ 2596 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2596 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3825", "outputIndexes": +[ 2597 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2592, 2595, 2597, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3828", "outputIndexes": +[ 2598 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2598 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3829", "outputIndexes": +[ 2599 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2599 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3830", "outputIndexes": +[ 2600 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2600, 2599 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3831", "outputIndexes": +[ 2601 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2591, 2601, 2594 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.28/self_attn/Gather_3_output_0", "outputIndexes": +[ 2602 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2602, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/self_attn/Div_1_output_0", "outputIndexes": +[ 2603 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2603, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.28/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2604 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2589, 2604, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.28/self_attn/Slice_3_output_0", "outputIndexes": +[ 2605 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2605 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.28/self_attn/Neg_1_output_0", "outputIndexes": +[ 2606 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2603, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.28/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2607 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2589, 20, 2607, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.28/self_attn/Slice_2_output_0", "outputIndexes": +[ 2608 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2606, 2608 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.28/self_attn/Concat_4_output_0", "outputIndexes": +[ 2609 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2609, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/self_attn/Mul_3_output_0", "outputIndexes": +[ 2610 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2590, 2610 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/self_attn/Add_1_output_0", "outputIndexes": +[ 2611 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3682 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3448803588, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.28/self_attn/v_proj/Linear", "outputIndexes": +[ 3691 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3691 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.28/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3692 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3692 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.28/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2612 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2551, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.28/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2613 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2559, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.28/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2614 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2613, 2614, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.28/self_attn/Concat_2_output_0", "outputIndexes": +[ 2615 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2612, 2615 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.28/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2616 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2584, 2611, 2616, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.28/self_attn/FusedAttention", "outputIndexes": +[ 2617 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2617 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.28/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3693 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3693 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.28/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3694 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3694 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3451162906, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.28/self_attn/o_proj/Linear", "outputIndexes": +[ 3695 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3695 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.28/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3696 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3696 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.28/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2618 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2538, 2618 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/Add_output_0", "outputIndexes": +[ 2619 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2619 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3460600112, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.28/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2620 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2620 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.28/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3697 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3697 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.28/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3698 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3698 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3460632880, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.28/mlp/gate_proj/Linear", "outputIndexes": +[ 3699 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3699 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.28/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3700 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3700 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.28/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2621 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2621 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.28/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2622 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3698 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3493663046, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.28/mlp/up_proj/Linear", "outputIndexes": +[ 3703 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3703 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.28/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3704 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3704 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.28/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2623 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2622, 2623 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/mlp/Mul_output_0", "outputIndexes": +[ 2624 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2624 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.28/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3705 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3705 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.28/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3706 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3706 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3526693212, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.28/mlp/down_proj/Linear", "outputIndexes": +[ 3707 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3707 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.28/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3708 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3708 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.28/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2625 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2619, 2625 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.28/Add_1_output_0", "outputIndexes": +[ 2626 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2626, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.29/Reshape_output_0", "outputIndexes": +[ 2627 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2627 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3559723378, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.29/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2628 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2628 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.29/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3709 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3709 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.29/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3710 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3710 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3559756146, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.29/self_attn/q_proj/Linear", "outputIndexes": +[ 3711 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3711 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.29/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3712 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3712 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.29/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2629 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2628 ] +, "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_output_0", "outputIndexes": +[ 2630 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2630 ] +, "main_type": "NONE", "name": "Shape3877", "outputIndexes": +[ 2631 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2630 ] +, "main_type": "NONE", "name": "Rank3879", "outputIndexes": +[ 2632 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2632, 2632 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3881", "outputIndexes": +[ 2633 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2633 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3882", "outputIndexes": +[ 2634 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2633, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3884", "outputIndexes": +[ 2635 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2635 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3885", "outputIndexes": +[ 2636 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2631, 2634, 2636, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3888", "outputIndexes": +[ 2637 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2637 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3889", "outputIndexes": +[ 2638 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2638, 2638 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3891", "outputIndexes": +[ 2639 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2630, 2639, 2633 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.29/self_attn/Gather_output_0", "outputIndexes": +[ 2640 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2640, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.29/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2641 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2633 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3899", "outputIndexes": +[ 2642 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2635 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3902", "outputIndexes": +[ 2643 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2631, 2642, 2643, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3905", "outputIndexes": +[ 2644 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2644 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3906", "outputIndexes": +[ 2645 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 2645 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3907", "outputIndexes": +[ 2646 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2646, 2645 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3908", "outputIndexes": +[ 2647 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2630, 2647, 2633 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.29/self_attn/Gather_1_output_0", "outputIndexes": +[ 2648 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2648, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.29/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2649 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2641, 2649, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.29/self_attn/Concat_output_0", "outputIndexes": +[ 2650 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2629, 2650 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.29/self_attn/Reshape_output_0", "outputIndexes": +[ 2651 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2651, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/self_attn/Mul_output_0", "outputIndexes": +[ 2652 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2651 ] +, "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_2_output_0", "outputIndexes": +[ 2653 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2653 ] +, "main_type": "NONE", "name": "Shape3915", "outputIndexes": +[ 2654 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2653 ] +, "main_type": "NONE", "name": "Rank3917", "outputIndexes": +[ 2655 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2655, 2655 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3919", "outputIndexes": +[ 2656 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2656 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3920", "outputIndexes": +[ 2657 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2656, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3922", "outputIndexes": +[ 2658 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2658 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3923", "outputIndexes": +[ 2659 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2654, 2657, 2659, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3926", "outputIndexes": +[ 2660 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2660 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3927", "outputIndexes": +[ 2661 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2661 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3928", "outputIndexes": +[ 2662 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2662, 2661 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3929", "outputIndexes": +[ 2663 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2653, 2663, 2656 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.29/self_attn/Gather_2_output_0", "outputIndexes": +[ 2664 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2664, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/self_attn/Div_output_0", "outputIndexes": +[ 2665 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2665, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.29/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2666 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2651, 2666, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.29/self_attn/Slice_1_output_0", "outputIndexes": +[ 2667 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2667 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.29/self_attn/Neg_output_0", "outputIndexes": +[ 2668 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2665, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.29/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2669 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2651, 20, 2669, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.29/self_attn/Slice_output_0", "outputIndexes": +[ 2670 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2668, 2670 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.29/self_attn/Concat_3_output_0", "outputIndexes": +[ 2671 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2671, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/self_attn/Mul_1_output_0", "outputIndexes": +[ 2672 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2652, 2672 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/self_attn/Add_output_0", "outputIndexes": +[ 2673 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3710 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3569193352, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.29/self_attn/k_proj/Linear", "outputIndexes": +[ 3715 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3715 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.29/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3716 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3716 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.29/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2674 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2640, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.29/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2675 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2648, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.29/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2676 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2675, 2676, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.29/self_attn/Concat_1_output_0", "outputIndexes": +[ 2677 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2674, 2677 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.29/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2678 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2678, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/self_attn/Mul_2_output_0", "outputIndexes": +[ 2679 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2678 ] +, "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_3_output_0", "outputIndexes": +[ 2680 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2680 ] +, "main_type": "NONE", "name": "Shape3948", "outputIndexes": +[ 2681 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2680 ] +, "main_type": "NONE", "name": "Rank3950", "outputIndexes": +[ 2682 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2682, 2682 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3952", "outputIndexes": +[ 2683 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2683 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3953", "outputIndexes": +[ 2684 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2683, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3955", "outputIndexes": +[ 2685 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2685 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3956", "outputIndexes": +[ 2686 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2681, 2684, 2686, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3959", "outputIndexes": +[ 2687 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2687 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3960", "outputIndexes": +[ 2688 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2688 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3961", "outputIndexes": +[ 2689 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2689, 2688 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3962", "outputIndexes": +[ 2690 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2680, 2690, 2683 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.29/self_attn/Gather_3_output_0", "outputIndexes": +[ 2691 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2691, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/self_attn/Div_1_output_0", "outputIndexes": +[ 2692 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2692, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.29/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2693 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2678, 2693, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.29/self_attn/Slice_3_output_0", "outputIndexes": +[ 2694 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2694 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.29/self_attn/Neg_1_output_0", "outputIndexes": +[ 2695 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2692, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.29/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2696 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2678, 20, 2696, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.29/self_attn/Slice_2_output_0", "outputIndexes": +[ 2697 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2695, 2697 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.29/self_attn/Concat_4_output_0", "outputIndexes": +[ 2698 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2698, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/self_attn/Mul_3_output_0", "outputIndexes": +[ 2699 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2679, 2699 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/self_attn/Add_1_output_0", "outputIndexes": +[ 2700 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3710 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3571552670, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.29/self_attn/v_proj/Linear", "outputIndexes": +[ 3719 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3719 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.29/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3720 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3720 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.29/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2701 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2640, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.29/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2702 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2648, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.29/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2703 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2702, 2703, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.29/self_attn/Concat_2_output_0", "outputIndexes": +[ 2704 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2701, 2704 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.29/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2705 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2673, 2700, 2705, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.29/self_attn/FusedAttention", "outputIndexes": +[ 2706 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2706 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.29/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3721 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3721 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.29/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3722 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3722 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3573911988, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.29/self_attn/o_proj/Linear", "outputIndexes": +[ 3723 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3723 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.29/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3724 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3724 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.29/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2707 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2627, 2707 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/Add_output_0", "outputIndexes": +[ 2708 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2708 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3583349194, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.29/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2709 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2709 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.29/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3725 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3725 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.29/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3726 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3726 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3583381962, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.29/mlp/gate_proj/Linear", "outputIndexes": +[ 3727 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3727 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.29/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3728 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3728 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.29/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2710 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2710 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.29/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2711 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3726 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3616412128, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.29/mlp/up_proj/Linear", "outputIndexes": +[ 3731 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3731 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.29/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3732 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3732 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.29/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2712 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2711, 2712 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/mlp/Mul_output_0", "outputIndexes": +[ 2713 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2713 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.29/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3733 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3733 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.29/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3734 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3734 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3649442294, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.29/mlp/down_proj/Linear", "outputIndexes": +[ 3735 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3735 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.29/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3736 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3736 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.29/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2714 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2708, 2714 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.29/Add_1_output_0", "outputIndexes": +[ 2715 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2715, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.30/Reshape_output_0", "outputIndexes": +[ 2716 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2716 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3682472460, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.30/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2717 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2717 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.30/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3737 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3737 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.30/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3738 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3738 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3682505228, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.30/self_attn/q_proj/Linear", "outputIndexes": +[ 3739 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3739 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.30/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3740 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3740 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.30/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2718 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2717 ] +, "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_output_0", "outputIndexes": +[ 2719 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2719 ] +, "main_type": "NONE", "name": "Shape4008", "outputIndexes": +[ 2720 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2719 ] +, "main_type": "NONE", "name": "Rank4010", "outputIndexes": +[ 2721 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2721, 2721 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4012", "outputIndexes": +[ 2722 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2722 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4013", "outputIndexes": +[ 2723 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2722, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4015", "outputIndexes": +[ 2724 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2724 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4016", "outputIndexes": +[ 2725 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2720, 2723, 2725, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4019", "outputIndexes": +[ 2726 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2726 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4020", "outputIndexes": +[ 2727 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2727, 2727 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4022", "outputIndexes": +[ 2728 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2719, 2728, 2722 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.30/self_attn/Gather_output_0", "outputIndexes": +[ 2729 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2729, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.30/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2730 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2722 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4030", "outputIndexes": +[ 2731 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2724 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4033", "outputIndexes": +[ 2732 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2720, 2731, 2732, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4036", "outputIndexes": +[ 2733 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2733 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4037", "outputIndexes": +[ 2734 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 2734 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4038", "outputIndexes": +[ 2735 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2735, 2734 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4039", "outputIndexes": +[ 2736 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2719, 2736, 2722 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.30/self_attn/Gather_1_output_0", "outputIndexes": +[ 2737 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2737, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.30/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2738 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2730, 2738, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.30/self_attn/Concat_output_0", "outputIndexes": +[ 2739 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2718, 2739 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.30/self_attn/Reshape_output_0", "outputIndexes": +[ 2740 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2740, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/self_attn/Mul_output_0", "outputIndexes": +[ 2741 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2740 ] +, "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_2_output_0", "outputIndexes": +[ 2742 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2742 ] +, "main_type": "NONE", "name": "Shape4046", "outputIndexes": +[ 2743 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2742 ] +, "main_type": "NONE", "name": "Rank4048", "outputIndexes": +[ 2744 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2744, 2744 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4050", "outputIndexes": +[ 2745 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2745 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4051", "outputIndexes": +[ 2746 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2745, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4053", "outputIndexes": +[ 2747 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2747 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4054", "outputIndexes": +[ 2748 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2743, 2746, 2748, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4057", "outputIndexes": +[ 2749 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2749 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4058", "outputIndexes": +[ 2750 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2750 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4059", "outputIndexes": +[ 2751 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2751, 2750 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4060", "outputIndexes": +[ 2752 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2742, 2752, 2745 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.30/self_attn/Gather_2_output_0", "outputIndexes": +[ 2753 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2753, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/self_attn/Div_output_0", "outputIndexes": +[ 2754 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2754, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.30/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2755 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2740, 2755, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.30/self_attn/Slice_1_output_0", "outputIndexes": +[ 2756 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2756 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.30/self_attn/Neg_output_0", "outputIndexes": +[ 2757 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2754, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.30/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2758 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2740, 20, 2758, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.30/self_attn/Slice_output_0", "outputIndexes": +[ 2759 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2757, 2759 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.30/self_attn/Concat_3_output_0", "outputIndexes": +[ 2760 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2760, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/self_attn/Mul_1_output_0", "outputIndexes": +[ 2761 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2741, 2761 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/self_attn/Add_output_0", "outputIndexes": +[ 2762 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3738 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3691942434, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.30/self_attn/k_proj/Linear", "outputIndexes": +[ 3743 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3743 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.30/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3744 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3744 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.30/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2763 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2729, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.30/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2764 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2737, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.30/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2765 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2764, 2765, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.30/self_attn/Concat_1_output_0", "outputIndexes": +[ 2766 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2763, 2766 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.30/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2767 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2767, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/self_attn/Mul_2_output_0", "outputIndexes": +[ 2768 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2767 ] +, "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_3_output_0", "outputIndexes": +[ 2769 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2769 ] +, "main_type": "NONE", "name": "Shape4079", "outputIndexes": +[ 2770 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2769 ] +, "main_type": "NONE", "name": "Rank4081", "outputIndexes": +[ 2771 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2771, 2771 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4083", "outputIndexes": +[ 2772 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2772 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4084", "outputIndexes": +[ 2773 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2772, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4086", "outputIndexes": +[ 2774 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2774 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4087", "outputIndexes": +[ 2775 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2770, 2773, 2775, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4090", "outputIndexes": +[ 2776 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2776 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4091", "outputIndexes": +[ 2777 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2777 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4092", "outputIndexes": +[ 2778 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2778, 2777 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4093", "outputIndexes": +[ 2779 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2769, 2779, 2772 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.30/self_attn/Gather_3_output_0", "outputIndexes": +[ 2780 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2780, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/self_attn/Div_1_output_0", "outputIndexes": +[ 2781 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2781, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.30/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2782 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2767, 2782, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.30/self_attn/Slice_3_output_0", "outputIndexes": +[ 2783 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2783 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.30/self_attn/Neg_1_output_0", "outputIndexes": +[ 2784 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2781, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.30/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2785 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2767, 20, 2785, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.30/self_attn/Slice_2_output_0", "outputIndexes": +[ 2786 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2784, 2786 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.30/self_attn/Concat_4_output_0", "outputIndexes": +[ 2787 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2787, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/self_attn/Mul_3_output_0", "outputIndexes": +[ 2788 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2768, 2788 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/self_attn/Add_1_output_0", "outputIndexes": +[ 2789 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3738 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3694301752, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.30/self_attn/v_proj/Linear", "outputIndexes": +[ 3747 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3747 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.30/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3748 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3748 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.30/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2790 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2729, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.30/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2791 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2737, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.30/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2792 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2791, 2792, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.30/self_attn/Concat_2_output_0", "outputIndexes": +[ 2793 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2790, 2793 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.30/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2794 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2762, 2789, 2794, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.30/self_attn/FusedAttention", "outputIndexes": +[ 2795 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2795 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.30/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3749 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3749 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.30/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3750 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3750 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3696661070, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.30/self_attn/o_proj/Linear", "outputIndexes": +[ 3751 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3751 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.30/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3752 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3752 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.30/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2796 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2716, 2796 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/Add_output_0", "outputIndexes": +[ 2797 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2797 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3706098276, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.30/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2798 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2798 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.30/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3753 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3753 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.30/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3754 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3754 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3706131044, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.30/mlp/gate_proj/Linear", "outputIndexes": +[ 3755 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3755 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.30/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3756 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3756 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.30/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2799 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2799 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.30/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2800 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3754 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3739161210, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.30/mlp/up_proj/Linear", "outputIndexes": +[ 3759 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3759 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.30/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3760 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3760 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.30/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2801 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2800, 2801 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/mlp/Mul_output_0", "outputIndexes": +[ 2802 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2802 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.30/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3761 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3761 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.30/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3762 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3762 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3772191376, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.30/mlp/down_proj/Linear", "outputIndexes": +[ 3763 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3763 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.30/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3764 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3764 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.30/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2803 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2797, 2803 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.30/Add_1_output_0", "outputIndexes": +[ 2804 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2804, 3 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.31/Reshape_output_0", "outputIndexes": +[ 2805 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2805 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3805221542, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.31/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2806 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2806 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.31/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3765 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3765 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.31/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3766 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3766 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3805254310, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.31/self_attn/q_proj/Linear", "outputIndexes": +[ 3767 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3767 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.31/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3768 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3768 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.31/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2807 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2806 ] +, "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_output_0", "outputIndexes": +[ 2808 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2808 ] +, "main_type": "NONE", "name": "Shape4139", "outputIndexes": +[ 2809 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2808 ] +, "main_type": "NONE", "name": "Rank4141", "outputIndexes": +[ 2810 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2810, 2810 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4143", "outputIndexes": +[ 2811 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2811 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4144", "outputIndexes": +[ 2812 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2811, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4146", "outputIndexes": +[ 2813 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2813 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4147", "outputIndexes": +[ 2814 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2809, 2812, 2814, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4150", "outputIndexes": +[ 2815 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2815 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4151", "outputIndexes": +[ 2816 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2816, 2816 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4153", "outputIndexes": +[ 2817 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2808, 2817, 2811 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.31/self_attn/Gather_output_0", "outputIndexes": +[ 2818 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2818, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.31/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2819 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2811 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4161", "outputIndexes": +[ 2820 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2813 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4164", "outputIndexes": +[ 2821 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2809, 2820, 2821, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4167", "outputIndexes": +[ 2822 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2822 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4168", "outputIndexes": +[ 2823 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 2823 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4169", "outputIndexes": +[ 2824 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2824, 2823 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4170", "outputIndexes": +[ 2825 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2808, 2825, 2811 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.31/self_attn/Gather_1_output_0", "outputIndexes": +[ 2826 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2826, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.31/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2827 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2819, 2827, 30, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.31/self_attn/Concat_output_0", "outputIndexes": +[ 2828 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2807, 2828 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.31/self_attn/Reshape_output_0", "outputIndexes": +[ 2829 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2829, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/self_attn/Mul_output_0", "outputIndexes": +[ 2830 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2829 ] +, "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_2_output_0", "outputIndexes": +[ 2831 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2831 ] +, "main_type": "NONE", "name": "Shape4177", "outputIndexes": +[ 2832 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2831 ] +, "main_type": "NONE", "name": "Rank4179", "outputIndexes": +[ 2833 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2833, 2833 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4181", "outputIndexes": +[ 2834 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2834 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4182", "outputIndexes": +[ 2835 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2834, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4184", "outputIndexes": +[ 2836 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2836 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4185", "outputIndexes": +[ 2837 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2832, 2835, 2837, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4188", "outputIndexes": +[ 2838 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2838 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4189", "outputIndexes": +[ 2839 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2839 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4190", "outputIndexes": +[ 2840 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2840, 2839 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4191", "outputIndexes": +[ 2841 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2831, 2841, 2834 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.31/self_attn/Gather_2_output_0", "outputIndexes": +[ 2842 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2842, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/self_attn/Div_output_0", "outputIndexes": +[ 2843 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2843, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.31/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2844 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2829, 2844, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.31/self_attn/Slice_1_output_0", "outputIndexes": +[ 2845 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2845 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.31/self_attn/Neg_output_0", "outputIndexes": +[ 2846 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2843, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.31/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2847 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2829, 20, 2847, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.31/self_attn/Slice_output_0", "outputIndexes": +[ 2848 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2846, 2848 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.31/self_attn/Concat_3_output_0", "outputIndexes": +[ 2849 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2849, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/self_attn/Mul_1_output_0", "outputIndexes": +[ 2850 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2830, 2850 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/self_attn/Add_output_0", "outputIndexes": +[ 2851 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3766 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3814691516, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.31/self_attn/k_proj/Linear", "outputIndexes": +[ 3771 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3771 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.31/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3772 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3772 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.31/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2852 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2818, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.31/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2853 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2826, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.31/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2854 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2853, 2854, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.31/self_attn/Concat_1_output_0", "outputIndexes": +[ 2855 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2852, 2855 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.31/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2856 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2856, 57 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/self_attn/Mul_2_output_0", "outputIndexes": +[ 2857 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2856 ] +, "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_3_output_0", "outputIndexes": +[ 2858 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2858 ] +, "main_type": "NONE", "name": "Shape4210", "outputIndexes": +[ 2859 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2858 ] +, "main_type": "NONE", "name": "Rank4212", "outputIndexes": +[ 2860 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2860, 2860 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4214", "outputIndexes": +[ 2861 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2861 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4215", "outputIndexes": +[ 2862 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2861, 12 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4217", "outputIndexes": +[ 2863 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2863 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4218", "outputIndexes": +[ 2864 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2859, 2862, 2864, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4221", "outputIndexes": +[ 2865 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2865 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4222", "outputIndexes": +[ 2866 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60, 2866 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4223", "outputIndexes": +[ 2867 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2867, 2866 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4224", "outputIndexes": +[ 2868 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2858, 2868, 2861 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.31/self_attn/Gather_3_output_0", "outputIndexes": +[ 2869 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2869, 72 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/self_attn/Div_1_output_0", "outputIndexes": +[ 2870 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2870, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.31/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2871 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2856, 2871, 75, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.31/self_attn/Slice_3_output_0", "outputIndexes": +[ 2872 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2872 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.31/self_attn/Neg_1_output_0", "outputIndexes": +[ 2873 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2870, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.31/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2874 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2856, 20, 2874, 76, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.31/self_attn/Slice_2_output_0", "outputIndexes": +[ 2875 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2873, 2875 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.31/self_attn/Concat_4_output_0", "outputIndexes": +[ 2876 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2876, 88 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/self_attn/Mul_3_output_0", "outputIndexes": +[ 2877 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2857, 2877 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/self_attn/Add_1_output_0", "outputIndexes": +[ 2878 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3766 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3817050834, 2097174, 262144, 0, 0 ] + } +, "name": "/layers.31/self_attn/v_proj/Linear", "outputIndexes": +[ 3775 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3775 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.31/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3776 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3776 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.31/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2879 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2818, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.31/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2880 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2826, 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.31/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2881 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2880, 2881, 94, 31 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.31/self_attn/Concat_2_output_0", "outputIndexes": +[ 2882 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2879, 2882 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.31/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2883 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2851, 2878, 2883, 124 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "/layers.31/self_attn/FusedAttention", "outputIndexes": +[ 2884 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2884 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.31/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3777 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3777 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.31/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3778 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3778 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3819410152, 8388630, 1048576, 0, 0 ] + } +, "name": "/layers.31/self_attn/o_proj/Linear", "outputIndexes": +[ 3779 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3779 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.31/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3780 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3780 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.31/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2885 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2805, 2885 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/Add_output_0", "outputIndexes": +[ 2886 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2886 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3828847358, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "/blocks.31/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2887 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2887 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.31/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3781 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3781 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.31/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3782 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3782 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3828880126, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.31/mlp/gate_proj/Linear", "outputIndexes": +[ 3783 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3783 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.31/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3784 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3784 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.31/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2888 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2888 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SILU", "T": "DT_INVALID" } +, "name": "/blocks.31/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2889 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3782 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3861910292, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.31/mlp/up_proj/Linear", "outputIndexes": +[ 3787 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3787 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.31/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3788 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3788 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 14336 ] +, "dimType": "NCHW" } +, "name": "/layers.31/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2890 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2889, 2890 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/mlp/Mul_output_0", "outputIndexes": +[ 2891 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2891 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 14336, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.31/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3789 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3789 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.31/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3790 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3790 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 3894940458, 29360150, 3670016, 0, 0 ] + } +, "name": "/layers.31/mlp/down_proj/Linear", "outputIndexes": +[ 3791 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3791 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.31/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3792 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3792 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 4096 ] +, "dimType": "NCHW" } +, "name": "/layers.31/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2892 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2886, 2892 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.31/Add_1_output_0", "outputIndexes": +[ 2893 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2893, 1, 75, 15, 15 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/Slice_output_0", "outputIndexes": +[ 2894 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2894 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.00001, "group": 1, "external": +[ 3927970624, 16384, 16384 ] +, "useRMSNorm": true } +, "name": "hidden_states", "outputIndexes": +[ 2895 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2895 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 4096, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/lm/lm_head/Linear/pre_reshape", "outputIndexes": +[ 3793 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3793 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/lm/lm_head/Linear/pre_convert", "outputIndexes": +[ 3794 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3794 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128256, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4104192, "has_scaleInt": false, "shapeInt32": true, "weightSize": 0 } +, "external": +[ 3928003392, 262668314, 32833536, 0, 0 ] + } +, "name": "/lm/lm_head/Linear", "outputIndexes": +[ 3795 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3795 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/lm/lm_head/Linear/post_convert", "outputIndexes": +[ 3796 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3796 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 128256 ] +, "dimType": "NCHW" } +, "name": "/lm/lm_head/Linear/post_reshape", "outputIndexes": +[ 2896 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } + ] +, "outputName": +[ "logits", "hidden_states" ] +, "preferForwardType": "CPU", "sourceType": "ONNX", "tensorName": +[ "position_ids", "logits_index", "input_ids", "/blocks.0/Constant_output_0", "/blocks.0/Reshape_output_0", "/blocks.0/input_layernorm/Mul_1_output_0", "/blocks.0/self_attn/q_proj/FakeLinear_output_0", "/blocks.0/self_attn/Shape_output_0", "Shape21", "Rank23", "BinaryOp25", "Unsqueeze26", "Const27", "BinaryOp28", "Unsqueeze29", "Unsqueeze31", "StridedSlice32", "Squeeze33", "BinaryOp35", "/blocks.0/self_attn/Gather_output_0", "/rotary/Constant_3_output_0", "/blocks.0/self_attn/Unsqueeze_output_0", "Unsqueeze45", "Unsqueeze48", "StridedSlice51", "Squeeze52", "BinaryOp53", "BinaryOp54", "/blocks.0/self_attn/Gather_1_output_0", "/blocks.0/self_attn/Unsqueeze_1_output_0", "/blocks.0/self_attn/Constant_2_output_0", "/blocks.0/self_attn/Constant_3_output_0", "/blocks.0/self_attn/Concat_output_0", "/blocks.0/self_attn/Reshape_output_0", "/rotary/Cast_output_0", "/rotary/Constant_output_0", "/rotary/Reshape_output_0", "/rotary/Constant_1_output_0", "/rotary/Mul_output_0", "/rotary/Cos_output_0", "/rotary/Unsqueeze_output_0", "/rotary/Sin_output_0", "/rotary/Unsqueeze_1_output_0", "/rotary/Concat_output_0", "/rotary/Concat_1_output_0", "/rotary/Constant_5_output_0", "/rotary/Unsqueeze_2_output_0", "/rotary/Unsqueeze_3_output_0", "Shape76", "Rank78", "BinaryOp80", "Unsqueeze81", "BinaryOp83", "Unsqueeze84", "StridedSlice87", "Squeeze88", "BinaryOp90", "/blocks.0/self_attn/Gather_2_output_0", "/blocks.0/self_attn/Mul_output_0", "/blocks.0/self_attn/Shape_2_output_0", "/blocks.0/self_attn/Constant_8_output_0", "Shape95", "Rank97", "BinaryOp99", "Unsqueeze100", "BinaryOp102", "Unsqueeze103", "StridedSlice106", "Squeeze107", "BinaryOp108", "BinaryOp109", "/blocks.0/self_attn/Gather_4_output_0", "/blocks.0/self_attn/Constant_9_output_0", "/blocks.0/self_attn/Div_output_0", "/blocks.0/self_attn/Unsqueeze_7_output_0", "/blocks.0/self_attn/Constant_16_output_0", "/blocks.0/self_attn/Constant_10_output_0", "/blocks.0/self_attn/Slice_1_output_0", "/blocks.0/self_attn/Neg_output_0", "/blocks.0/self_attn/Unsqueeze_6_output_0", "/blocks.0/self_attn/Slice_output_0", "/blocks.0/self_attn/Concat_3_output_0", "Unsqueeze127", "Unsqueeze130", "StridedSlice133", "Squeeze134", "BinaryOp135", "BinaryOp136", "/blocks.0/self_attn/Gather_3_output_0", "/blocks.0/self_attn/Mul_1_output_0", "/blocks.0/self_attn/Add_output_0", "/blocks.0/self_attn/k_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_2_output_0", "/blocks.0/self_attn/Unsqueeze_3_output_0", "/blocks.0/self_attn/Constant_4_output_0", "/blocks.0/self_attn/Concat_1_output_0", "/blocks.0/self_attn/Reshape_1_output_0", "/blocks.0/self_attn/Mul_2_output_0", "/blocks.0/self_attn/Shape_3_output_0", "Shape148", "Rank150", "BinaryOp152", "Unsqueeze153", "BinaryOp155", "Unsqueeze156", "StridedSlice159", "Squeeze160", "BinaryOp161", "BinaryOp162", "/blocks.0/self_attn/Gather_5_output_0", "/blocks.0/self_attn/Div_1_output_0", "/blocks.0/self_attn/Unsqueeze_9_output_0", "/blocks.0/self_attn/Slice_3_output_0", "/blocks.0/self_attn/Neg_1_output_0", "/blocks.0/self_attn/Unsqueeze_8_output_0", "/blocks.0/self_attn/Slice_2_output_0", "/blocks.0/self_attn/Concat_4_output_0", "/blocks.0/self_attn/Mul_3_output_0", "/blocks.0/self_attn/Add_1_output_0", "/blocks.0/self_attn/v_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_4_output_0", "/blocks.0/self_attn/Unsqueeze_5_output_0", "/blocks.0/self_attn/Concat_2_output_0", "/blocks.0/self_attn/Reshape_2_output_0", "attention_mask", "/blocks.0/self_attn/fused_attn/FusedAttention_output_0", "/blocks.0/self_attn/o_proj/FakeLinear_output_0", "/blocks.0/Add_output_0", "/blocks.0/post_attention_layernorm/Mul_1_output_0", "/blocks.0/mlp/gate_proj/FakeLinear_output_0", "/blocks.0/mlp/act_fn/Mul_output_0", "/blocks.0/mlp/up_proj/FakeLinear_output_0", "/blocks.0/mlp/Mul_output_0", "/blocks.0/mlp/down_proj/FakeLinear_output_0", "/blocks.0/Add_1_output_0", "/blocks.1/Reshape_output_0", "/blocks.1/input_layernorm/Mul_1_output_0", "/blocks.1/self_attn/q_proj/FakeLinear_output_0", "/blocks.1/self_attn/Shape_output_0", "Shape209", "Rank211", "BinaryOp213", "Unsqueeze214", "BinaryOp216", "Unsqueeze217", "StridedSlice220", "Squeeze221", "BinaryOp223", "/blocks.1/self_attn/Gather_output_0", "/blocks.1/self_attn/Unsqueeze_output_0", "Unsqueeze231", "Unsqueeze234", "StridedSlice237", "Squeeze238", "BinaryOp239", "BinaryOp240", "/blocks.1/self_attn/Gather_1_output_0", "/blocks.1/self_attn/Unsqueeze_1_output_0", "/blocks.1/self_attn/Concat_output_0", "/blocks.1/self_attn/Reshape_output_0", "/blocks.1/self_attn/Mul_output_0", "/blocks.1/self_attn/Shape_2_output_0", "Shape247", "Rank249", "BinaryOp251", "Unsqueeze252", "BinaryOp254", "Unsqueeze255", "StridedSlice258", "Squeeze259", "BinaryOp260", "BinaryOp261", "/blocks.1/self_attn/Gather_2_output_0", "/blocks.1/self_attn/Div_output_0", "/blocks.1/self_attn/Unsqueeze_7_output_0", "/blocks.1/self_attn/Slice_1_output_0", "/blocks.1/self_attn/Neg_output_0", "/blocks.1/self_attn/Unsqueeze_6_output_0", "/blocks.1/self_attn/Slice_output_0", "/blocks.1/self_attn/Concat_3_output_0", "/blocks.1/self_attn/Mul_1_output_0", "/blocks.1/self_attn/Add_output_0", "/blocks.1/self_attn/k_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_2_output_0", "/blocks.1/self_attn/Unsqueeze_3_output_0", "/blocks.1/self_attn/Concat_1_output_0", "/blocks.1/self_attn/Reshape_1_output_0", "/blocks.1/self_attn/Mul_2_output_0", "/blocks.1/self_attn/Shape_3_output_0", "Shape280", "Rank282", "BinaryOp284", "Unsqueeze285", "BinaryOp287", "Unsqueeze288", "StridedSlice291", "Squeeze292", "BinaryOp293", "BinaryOp294", "/blocks.1/self_attn/Gather_3_output_0", "/blocks.1/self_attn/Div_1_output_0", "/blocks.1/self_attn/Unsqueeze_9_output_0", "/blocks.1/self_attn/Slice_3_output_0", "/blocks.1/self_attn/Neg_1_output_0", "/blocks.1/self_attn/Unsqueeze_8_output_0", "/blocks.1/self_attn/Slice_2_output_0", "/blocks.1/self_attn/Concat_4_output_0", "/blocks.1/self_attn/Mul_3_output_0", "/blocks.1/self_attn/Add_1_output_0", "/blocks.1/self_attn/v_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_4_output_0", "/blocks.1/self_attn/Unsqueeze_5_output_0", "/blocks.1/self_attn/Concat_2_output_0", "/blocks.1/self_attn/Reshape_2_output_0", "/blocks.1/self_attn/fused_attn/FusedAttention_output_0", "/blocks.1/self_attn/o_proj/FakeLinear_output_0", "/blocks.1/Add_output_0", "/blocks.1/post_attention_layernorm/Mul_1_output_0", "/blocks.1/mlp/gate_proj/FakeLinear_output_0", "/blocks.1/mlp/act_fn/Mul_output_0", "/blocks.1/mlp/up_proj/FakeLinear_output_0", "/blocks.1/mlp/Mul_output_0", "/blocks.1/mlp/down_proj/FakeLinear_output_0", "/blocks.1/Add_1_output_0", "/blocks.2/Reshape_output_0", "/blocks.2/input_layernorm/Mul_1_output_0", "/blocks.2/self_attn/q_proj/FakeLinear_output_0", "/blocks.2/self_attn/Shape_output_0", "Shape340", "Rank342", "BinaryOp344", "Unsqueeze345", "BinaryOp347", "Unsqueeze348", "StridedSlice351", "Squeeze352", "BinaryOp354", "/blocks.2/self_attn/Gather_output_0", "/blocks.2/self_attn/Unsqueeze_output_0", "Unsqueeze362", "Unsqueeze365", "StridedSlice368", "Squeeze369", "BinaryOp370", "BinaryOp371", "/blocks.2/self_attn/Gather_1_output_0", "/blocks.2/self_attn/Unsqueeze_1_output_0", "/blocks.2/self_attn/Concat_output_0", "/blocks.2/self_attn/Reshape_output_0", "/blocks.2/self_attn/Mul_output_0", "/blocks.2/self_attn/Shape_2_output_0", "Shape378", "Rank380", "BinaryOp382", "Unsqueeze383", "BinaryOp385", "Unsqueeze386", "StridedSlice389", "Squeeze390", "BinaryOp391", "BinaryOp392", "/blocks.2/self_attn/Gather_2_output_0", "/blocks.2/self_attn/Div_output_0", "/blocks.2/self_attn/Unsqueeze_7_output_0", "/blocks.2/self_attn/Slice_1_output_0", "/blocks.2/self_attn/Neg_output_0", "/blocks.2/self_attn/Unsqueeze_6_output_0", "/blocks.2/self_attn/Slice_output_0", "/blocks.2/self_attn/Concat_3_output_0", "/blocks.2/self_attn/Mul_1_output_0", "/blocks.2/self_attn/Add_output_0", "/blocks.2/self_attn/k_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_2_output_0", "/blocks.2/self_attn/Unsqueeze_3_output_0", "/blocks.2/self_attn/Concat_1_output_0", "/blocks.2/self_attn/Reshape_1_output_0", "/blocks.2/self_attn/Mul_2_output_0", "/blocks.2/self_attn/Shape_3_output_0", "Shape411", "Rank413", "BinaryOp415", "Unsqueeze416", "BinaryOp418", "Unsqueeze419", "StridedSlice422", "Squeeze423", "BinaryOp424", "BinaryOp425", "/blocks.2/self_attn/Gather_3_output_0", "/blocks.2/self_attn/Div_1_output_0", "/blocks.2/self_attn/Unsqueeze_9_output_0", "/blocks.2/self_attn/Slice_3_output_0", "/blocks.2/self_attn/Neg_1_output_0", "/blocks.2/self_attn/Unsqueeze_8_output_0", "/blocks.2/self_attn/Slice_2_output_0", "/blocks.2/self_attn/Concat_4_output_0", "/blocks.2/self_attn/Mul_3_output_0", "/blocks.2/self_attn/Add_1_output_0", "/blocks.2/self_attn/v_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_4_output_0", "/blocks.2/self_attn/Unsqueeze_5_output_0", "/blocks.2/self_attn/Concat_2_output_0", "/blocks.2/self_attn/Reshape_2_output_0", "/blocks.2/self_attn/fused_attn/FusedAttention_output_0", "/blocks.2/self_attn/o_proj/FakeLinear_output_0", "/blocks.2/Add_output_0", "/blocks.2/post_attention_layernorm/Mul_1_output_0", "/blocks.2/mlp/gate_proj/FakeLinear_output_0", "/blocks.2/mlp/act_fn/Mul_output_0", "/blocks.2/mlp/up_proj/FakeLinear_output_0", "/blocks.2/mlp/Mul_output_0", "/blocks.2/mlp/down_proj/FakeLinear_output_0", "/blocks.2/Add_1_output_0", "/blocks.3/Reshape_output_0", "/blocks.3/input_layernorm/Mul_1_output_0", "/blocks.3/self_attn/q_proj/FakeLinear_output_0", "/blocks.3/self_attn/Shape_output_0", "Shape471", "Rank473", "BinaryOp475", "Unsqueeze476", "BinaryOp478", "Unsqueeze479", "StridedSlice482", "Squeeze483", "BinaryOp485", "/blocks.3/self_attn/Gather_output_0", "/blocks.3/self_attn/Unsqueeze_output_0", "Unsqueeze493", "Unsqueeze496", "StridedSlice499", "Squeeze500", "BinaryOp501", "BinaryOp502", "/blocks.3/self_attn/Gather_1_output_0", "/blocks.3/self_attn/Unsqueeze_1_output_0", "/blocks.3/self_attn/Concat_output_0", "/blocks.3/self_attn/Reshape_output_0", "/blocks.3/self_attn/Mul_output_0", "/blocks.3/self_attn/Shape_2_output_0", "Shape509", "Rank511", "BinaryOp513", "Unsqueeze514", "BinaryOp516", "Unsqueeze517", "StridedSlice520", "Squeeze521", "BinaryOp522", "BinaryOp523", "/blocks.3/self_attn/Gather_2_output_0", "/blocks.3/self_attn/Div_output_0", "/blocks.3/self_attn/Unsqueeze_7_output_0", "/blocks.3/self_attn/Slice_1_output_0", "/blocks.3/self_attn/Neg_output_0", "/blocks.3/self_attn/Unsqueeze_6_output_0", "/blocks.3/self_attn/Slice_output_0", "/blocks.3/self_attn/Concat_3_output_0", "/blocks.3/self_attn/Mul_1_output_0", "/blocks.3/self_attn/Add_output_0", "/blocks.3/self_attn/k_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_2_output_0", "/blocks.3/self_attn/Unsqueeze_3_output_0", "/blocks.3/self_attn/Concat_1_output_0", "/blocks.3/self_attn/Reshape_1_output_0", "/blocks.3/self_attn/Mul_2_output_0", "/blocks.3/self_attn/Shape_3_output_0", "Shape542", "Rank544", "BinaryOp546", "Unsqueeze547", "BinaryOp549", "Unsqueeze550", "StridedSlice553", "Squeeze554", "BinaryOp555", "BinaryOp556", "/blocks.3/self_attn/Gather_3_output_0", "/blocks.3/self_attn/Div_1_output_0", "/blocks.3/self_attn/Unsqueeze_9_output_0", "/blocks.3/self_attn/Slice_3_output_0", "/blocks.3/self_attn/Neg_1_output_0", "/blocks.3/self_attn/Unsqueeze_8_output_0", "/blocks.3/self_attn/Slice_2_output_0", "/blocks.3/self_attn/Concat_4_output_0", "/blocks.3/self_attn/Mul_3_output_0", "/blocks.3/self_attn/Add_1_output_0", "/blocks.3/self_attn/v_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_4_output_0", "/blocks.3/self_attn/Unsqueeze_5_output_0", "/blocks.3/self_attn/Concat_2_output_0", "/blocks.3/self_attn/Reshape_2_output_0", "/blocks.3/self_attn/fused_attn/FusedAttention_output_0", "/blocks.3/self_attn/o_proj/FakeLinear_output_0", "/blocks.3/Add_output_0", "/blocks.3/post_attention_layernorm/Mul_1_output_0", "/blocks.3/mlp/gate_proj/FakeLinear_output_0", "/blocks.3/mlp/act_fn/Mul_output_0", "/blocks.3/mlp/up_proj/FakeLinear_output_0", "/blocks.3/mlp/Mul_output_0", "/blocks.3/mlp/down_proj/FakeLinear_output_0", "/blocks.3/Add_1_output_0", "/blocks.4/Reshape_output_0", "/blocks.4/input_layernorm/Mul_1_output_0", "/blocks.4/self_attn/q_proj/FakeLinear_output_0", "/blocks.4/self_attn/Shape_output_0", "Shape602", "Rank604", "BinaryOp606", "Unsqueeze607", "BinaryOp609", "Unsqueeze610", "StridedSlice613", "Squeeze614", "BinaryOp616", "/blocks.4/self_attn/Gather_output_0", "/blocks.4/self_attn/Unsqueeze_output_0", "Unsqueeze624", "Unsqueeze627", "StridedSlice630", "Squeeze631", "BinaryOp632", "BinaryOp633", "/blocks.4/self_attn/Gather_1_output_0", "/blocks.4/self_attn/Unsqueeze_1_output_0", "/blocks.4/self_attn/Concat_output_0", "/blocks.4/self_attn/Reshape_output_0", "/blocks.4/self_attn/Mul_output_0", "/blocks.4/self_attn/Shape_2_output_0", "Shape640", "Rank642", "BinaryOp644", "Unsqueeze645", "BinaryOp647", "Unsqueeze648", "StridedSlice651", "Squeeze652", "BinaryOp653", "BinaryOp654", "/blocks.4/self_attn/Gather_2_output_0", "/blocks.4/self_attn/Div_output_0", "/blocks.4/self_attn/Unsqueeze_7_output_0", "/blocks.4/self_attn/Slice_1_output_0", "/blocks.4/self_attn/Neg_output_0", "/blocks.4/self_attn/Unsqueeze_6_output_0", "/blocks.4/self_attn/Slice_output_0", "/blocks.4/self_attn/Concat_3_output_0", "/blocks.4/self_attn/Mul_1_output_0", "/blocks.4/self_attn/Add_output_0", "/blocks.4/self_attn/k_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_2_output_0", "/blocks.4/self_attn/Unsqueeze_3_output_0", "/blocks.4/self_attn/Concat_1_output_0", "/blocks.4/self_attn/Reshape_1_output_0", "/blocks.4/self_attn/Mul_2_output_0", "/blocks.4/self_attn/Shape_3_output_0", "Shape673", "Rank675", "BinaryOp677", "Unsqueeze678", "BinaryOp680", "Unsqueeze681", "StridedSlice684", "Squeeze685", "BinaryOp686", "BinaryOp687", "/blocks.4/self_attn/Gather_3_output_0", "/blocks.4/self_attn/Div_1_output_0", "/blocks.4/self_attn/Unsqueeze_9_output_0", "/blocks.4/self_attn/Slice_3_output_0", "/blocks.4/self_attn/Neg_1_output_0", "/blocks.4/self_attn/Unsqueeze_8_output_0", "/blocks.4/self_attn/Slice_2_output_0", "/blocks.4/self_attn/Concat_4_output_0", "/blocks.4/self_attn/Mul_3_output_0", "/blocks.4/self_attn/Add_1_output_0", "/blocks.4/self_attn/v_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_4_output_0", "/blocks.4/self_attn/Unsqueeze_5_output_0", "/blocks.4/self_attn/Concat_2_output_0", "/blocks.4/self_attn/Reshape_2_output_0", "/blocks.4/self_attn/fused_attn/FusedAttention_output_0", "/blocks.4/self_attn/o_proj/FakeLinear_output_0", "/blocks.4/Add_output_0", "/blocks.4/post_attention_layernorm/Mul_1_output_0", "/blocks.4/mlp/gate_proj/FakeLinear_output_0", "/blocks.4/mlp/act_fn/Mul_output_0", "/blocks.4/mlp/up_proj/FakeLinear_output_0", "/blocks.4/mlp/Mul_output_0", "/blocks.4/mlp/down_proj/FakeLinear_output_0", "/blocks.4/Add_1_output_0", "/blocks.5/Reshape_output_0", "/blocks.5/input_layernorm/Mul_1_output_0", "/blocks.5/self_attn/q_proj/FakeLinear_output_0", "/blocks.5/self_attn/Shape_output_0", "Shape733", "Rank735", "BinaryOp737", "Unsqueeze738", "BinaryOp740", "Unsqueeze741", "StridedSlice744", "Squeeze745", "BinaryOp747", "/blocks.5/self_attn/Gather_output_0", "/blocks.5/self_attn/Unsqueeze_output_0", "Unsqueeze755", "Unsqueeze758", "StridedSlice761", "Squeeze762", "BinaryOp763", "BinaryOp764", "/blocks.5/self_attn/Gather_1_output_0", "/blocks.5/self_attn/Unsqueeze_1_output_0", "/blocks.5/self_attn/Concat_output_0", "/blocks.5/self_attn/Reshape_output_0", "/blocks.5/self_attn/Mul_output_0", "/blocks.5/self_attn/Shape_2_output_0", "Shape771", "Rank773", "BinaryOp775", "Unsqueeze776", "BinaryOp778", "Unsqueeze779", "StridedSlice782", "Squeeze783", "BinaryOp784", "BinaryOp785", "/blocks.5/self_attn/Gather_2_output_0", "/blocks.5/self_attn/Div_output_0", "/blocks.5/self_attn/Unsqueeze_7_output_0", "/blocks.5/self_attn/Slice_1_output_0", "/blocks.5/self_attn/Neg_output_0", "/blocks.5/self_attn/Unsqueeze_6_output_0", "/blocks.5/self_attn/Slice_output_0", "/blocks.5/self_attn/Concat_3_output_0", "/blocks.5/self_attn/Mul_1_output_0", "/blocks.5/self_attn/Add_output_0", "/blocks.5/self_attn/k_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_2_output_0", "/blocks.5/self_attn/Unsqueeze_3_output_0", "/blocks.5/self_attn/Concat_1_output_0", "/blocks.5/self_attn/Reshape_1_output_0", "/blocks.5/self_attn/Mul_2_output_0", "/blocks.5/self_attn/Shape_3_output_0", "Shape804", "Rank806", "BinaryOp808", "Unsqueeze809", "BinaryOp811", "Unsqueeze812", "StridedSlice815", "Squeeze816", "BinaryOp817", "BinaryOp818", "/blocks.5/self_attn/Gather_3_output_0", "/blocks.5/self_attn/Div_1_output_0", "/blocks.5/self_attn/Unsqueeze_9_output_0", "/blocks.5/self_attn/Slice_3_output_0", "/blocks.5/self_attn/Neg_1_output_0", "/blocks.5/self_attn/Unsqueeze_8_output_0", "/blocks.5/self_attn/Slice_2_output_0", "/blocks.5/self_attn/Concat_4_output_0", "/blocks.5/self_attn/Mul_3_output_0", "/blocks.5/self_attn/Add_1_output_0", "/blocks.5/self_attn/v_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_4_output_0", "/blocks.5/self_attn/Unsqueeze_5_output_0", "/blocks.5/self_attn/Concat_2_output_0", "/blocks.5/self_attn/Reshape_2_output_0", "/blocks.5/self_attn/fused_attn/FusedAttention_output_0", "/blocks.5/self_attn/o_proj/FakeLinear_output_0", "/blocks.5/Add_output_0", "/blocks.5/post_attention_layernorm/Mul_1_output_0", "/blocks.5/mlp/gate_proj/FakeLinear_output_0", "/blocks.5/mlp/act_fn/Mul_output_0", "/blocks.5/mlp/up_proj/FakeLinear_output_0", "/blocks.5/mlp/Mul_output_0", "/blocks.5/mlp/down_proj/FakeLinear_output_0", "/blocks.5/Add_1_output_0", "/blocks.6/Reshape_output_0", "/blocks.6/input_layernorm/Mul_1_output_0", "/blocks.6/self_attn/q_proj/FakeLinear_output_0", "/blocks.6/self_attn/Shape_output_0", "Shape864", "Rank866", "BinaryOp868", "Unsqueeze869", "BinaryOp871", "Unsqueeze872", "StridedSlice875", "Squeeze876", "BinaryOp878", "/blocks.6/self_attn/Gather_output_0", "/blocks.6/self_attn/Unsqueeze_output_0", "Unsqueeze886", "Unsqueeze889", "StridedSlice892", "Squeeze893", "BinaryOp894", "BinaryOp895", "/blocks.6/self_attn/Gather_1_output_0", "/blocks.6/self_attn/Unsqueeze_1_output_0", "/blocks.6/self_attn/Concat_output_0", "/blocks.6/self_attn/Reshape_output_0", "/blocks.6/self_attn/Mul_output_0", "/blocks.6/self_attn/Shape_2_output_0", "Shape902", "Rank904", "BinaryOp906", "Unsqueeze907", "BinaryOp909", "Unsqueeze910", "StridedSlice913", "Squeeze914", "BinaryOp915", "BinaryOp916", "/blocks.6/self_attn/Gather_2_output_0", "/blocks.6/self_attn/Div_output_0", "/blocks.6/self_attn/Unsqueeze_7_output_0", "/blocks.6/self_attn/Slice_1_output_0", "/blocks.6/self_attn/Neg_output_0", "/blocks.6/self_attn/Unsqueeze_6_output_0", "/blocks.6/self_attn/Slice_output_0", "/blocks.6/self_attn/Concat_3_output_0", "/blocks.6/self_attn/Mul_1_output_0", "/blocks.6/self_attn/Add_output_0", "/blocks.6/self_attn/k_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_2_output_0", "/blocks.6/self_attn/Unsqueeze_3_output_0", "/blocks.6/self_attn/Concat_1_output_0", "/blocks.6/self_attn/Reshape_1_output_0", "/blocks.6/self_attn/Mul_2_output_0", "/blocks.6/self_attn/Shape_3_output_0", "Shape935", "Rank937", "BinaryOp939", "Unsqueeze940", "BinaryOp942", "Unsqueeze943", "StridedSlice946", "Squeeze947", "BinaryOp948", "BinaryOp949", "/blocks.6/self_attn/Gather_3_output_0", "/blocks.6/self_attn/Div_1_output_0", "/blocks.6/self_attn/Unsqueeze_9_output_0", "/blocks.6/self_attn/Slice_3_output_0", "/blocks.6/self_attn/Neg_1_output_0", "/blocks.6/self_attn/Unsqueeze_8_output_0", "/blocks.6/self_attn/Slice_2_output_0", "/blocks.6/self_attn/Concat_4_output_0", "/blocks.6/self_attn/Mul_3_output_0", "/blocks.6/self_attn/Add_1_output_0", "/blocks.6/self_attn/v_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_4_output_0", "/blocks.6/self_attn/Unsqueeze_5_output_0", "/blocks.6/self_attn/Concat_2_output_0", "/blocks.6/self_attn/Reshape_2_output_0", "/blocks.6/self_attn/fused_attn/FusedAttention_output_0", "/blocks.6/self_attn/o_proj/FakeLinear_output_0", "/blocks.6/Add_output_0", "/blocks.6/post_attention_layernorm/Mul_1_output_0", "/blocks.6/mlp/gate_proj/FakeLinear_output_0", "/blocks.6/mlp/act_fn/Mul_output_0", "/blocks.6/mlp/up_proj/FakeLinear_output_0", "/blocks.6/mlp/Mul_output_0", "/blocks.6/mlp/down_proj/FakeLinear_output_0", "/blocks.6/Add_1_output_0", "/blocks.7/Reshape_output_0", "/blocks.7/input_layernorm/Mul_1_output_0", "/blocks.7/self_attn/q_proj/FakeLinear_output_0", "/blocks.7/self_attn/Shape_output_0", "Shape995", "Rank997", "BinaryOp999", "Unsqueeze1000", "BinaryOp1002", "Unsqueeze1003", "StridedSlice1006", "Squeeze1007", "BinaryOp1009", "/blocks.7/self_attn/Gather_output_0", "/blocks.7/self_attn/Unsqueeze_output_0", "Unsqueeze1017", "Unsqueeze1020", "StridedSlice1023", "Squeeze1024", "BinaryOp1025", "BinaryOp1026", "/blocks.7/self_attn/Gather_1_output_0", "/blocks.7/self_attn/Unsqueeze_1_output_0", "/blocks.7/self_attn/Concat_output_0", "/blocks.7/self_attn/Reshape_output_0", "/blocks.7/self_attn/Mul_output_0", "/blocks.7/self_attn/Shape_2_output_0", "Shape1033", "Rank1035", "BinaryOp1037", "Unsqueeze1038", "BinaryOp1040", "Unsqueeze1041", "StridedSlice1044", "Squeeze1045", "BinaryOp1046", "BinaryOp1047", "/blocks.7/self_attn/Gather_2_output_0", "/blocks.7/self_attn/Div_output_0", "/blocks.7/self_attn/Unsqueeze_7_output_0", "/blocks.7/self_attn/Slice_1_output_0", "/blocks.7/self_attn/Neg_output_0", "/blocks.7/self_attn/Unsqueeze_6_output_0", "/blocks.7/self_attn/Slice_output_0", "/blocks.7/self_attn/Concat_3_output_0", "/blocks.7/self_attn/Mul_1_output_0", "/blocks.7/self_attn/Add_output_0", "/blocks.7/self_attn/k_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_2_output_0", "/blocks.7/self_attn/Unsqueeze_3_output_0", "/blocks.7/self_attn/Concat_1_output_0", "/blocks.7/self_attn/Reshape_1_output_0", "/blocks.7/self_attn/Mul_2_output_0", "/blocks.7/self_attn/Shape_3_output_0", "Shape1066", "Rank1068", "BinaryOp1070", "Unsqueeze1071", "BinaryOp1073", "Unsqueeze1074", "StridedSlice1077", "Squeeze1078", "BinaryOp1079", "BinaryOp1080", "/blocks.7/self_attn/Gather_3_output_0", "/blocks.7/self_attn/Div_1_output_0", "/blocks.7/self_attn/Unsqueeze_9_output_0", "/blocks.7/self_attn/Slice_3_output_0", "/blocks.7/self_attn/Neg_1_output_0", "/blocks.7/self_attn/Unsqueeze_8_output_0", "/blocks.7/self_attn/Slice_2_output_0", "/blocks.7/self_attn/Concat_4_output_0", "/blocks.7/self_attn/Mul_3_output_0", "/blocks.7/self_attn/Add_1_output_0", "/blocks.7/self_attn/v_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_4_output_0", "/blocks.7/self_attn/Unsqueeze_5_output_0", "/blocks.7/self_attn/Concat_2_output_0", "/blocks.7/self_attn/Reshape_2_output_0", "/blocks.7/self_attn/fused_attn/FusedAttention_output_0", "/blocks.7/self_attn/o_proj/FakeLinear_output_0", "/blocks.7/Add_output_0", "/blocks.7/post_attention_layernorm/Mul_1_output_0", "/blocks.7/mlp/gate_proj/FakeLinear_output_0", "/blocks.7/mlp/act_fn/Mul_output_0", "/blocks.7/mlp/up_proj/FakeLinear_output_0", "/blocks.7/mlp/Mul_output_0", "/blocks.7/mlp/down_proj/FakeLinear_output_0", "/blocks.7/Add_1_output_0", "/blocks.8/Reshape_output_0", "/blocks.8/input_layernorm/Mul_1_output_0", "/blocks.8/self_attn/q_proj/FakeLinear_output_0", "/blocks.8/self_attn/Shape_output_0", "Shape1126", "Rank1128", "BinaryOp1130", "Unsqueeze1131", "BinaryOp1133", "Unsqueeze1134", "StridedSlice1137", "Squeeze1138", "BinaryOp1140", "/blocks.8/self_attn/Gather_output_0", "/blocks.8/self_attn/Unsqueeze_output_0", "Unsqueeze1148", "Unsqueeze1151", "StridedSlice1154", "Squeeze1155", "BinaryOp1156", "BinaryOp1157", "/blocks.8/self_attn/Gather_1_output_0", "/blocks.8/self_attn/Unsqueeze_1_output_0", "/blocks.8/self_attn/Concat_output_0", "/blocks.8/self_attn/Reshape_output_0", "/blocks.8/self_attn/Mul_output_0", "/blocks.8/self_attn/Shape_2_output_0", "Shape1164", "Rank1166", "BinaryOp1168", "Unsqueeze1169", "BinaryOp1171", "Unsqueeze1172", "StridedSlice1175", "Squeeze1176", "BinaryOp1177", "BinaryOp1178", "/blocks.8/self_attn/Gather_2_output_0", "/blocks.8/self_attn/Div_output_0", "/blocks.8/self_attn/Unsqueeze_7_output_0", "/blocks.8/self_attn/Slice_1_output_0", "/blocks.8/self_attn/Neg_output_0", "/blocks.8/self_attn/Unsqueeze_6_output_0", "/blocks.8/self_attn/Slice_output_0", "/blocks.8/self_attn/Concat_3_output_0", "/blocks.8/self_attn/Mul_1_output_0", "/blocks.8/self_attn/Add_output_0", "/blocks.8/self_attn/k_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_2_output_0", "/blocks.8/self_attn/Unsqueeze_3_output_0", "/blocks.8/self_attn/Concat_1_output_0", "/blocks.8/self_attn/Reshape_1_output_0", "/blocks.8/self_attn/Mul_2_output_0", "/blocks.8/self_attn/Shape_3_output_0", "Shape1197", "Rank1199", "BinaryOp1201", "Unsqueeze1202", "BinaryOp1204", "Unsqueeze1205", "StridedSlice1208", "Squeeze1209", "BinaryOp1210", "BinaryOp1211", "/blocks.8/self_attn/Gather_3_output_0", "/blocks.8/self_attn/Div_1_output_0", "/blocks.8/self_attn/Unsqueeze_9_output_0", "/blocks.8/self_attn/Slice_3_output_0", "/blocks.8/self_attn/Neg_1_output_0", "/blocks.8/self_attn/Unsqueeze_8_output_0", "/blocks.8/self_attn/Slice_2_output_0", "/blocks.8/self_attn/Concat_4_output_0", "/blocks.8/self_attn/Mul_3_output_0", "/blocks.8/self_attn/Add_1_output_0", "/blocks.8/self_attn/v_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_4_output_0", "/blocks.8/self_attn/Unsqueeze_5_output_0", "/blocks.8/self_attn/Concat_2_output_0", "/blocks.8/self_attn/Reshape_2_output_0", "/blocks.8/self_attn/fused_attn/FusedAttention_output_0", "/blocks.8/self_attn/o_proj/FakeLinear_output_0", "/blocks.8/Add_output_0", "/blocks.8/post_attention_layernorm/Mul_1_output_0", "/blocks.8/mlp/gate_proj/FakeLinear_output_0", "/blocks.8/mlp/act_fn/Mul_output_0", "/blocks.8/mlp/up_proj/FakeLinear_output_0", "/blocks.8/mlp/Mul_output_0", "/blocks.8/mlp/down_proj/FakeLinear_output_0", "/blocks.8/Add_1_output_0", "/blocks.9/Reshape_output_0", "/blocks.9/input_layernorm/Mul_1_output_0", "/blocks.9/self_attn/q_proj/FakeLinear_output_0", "/blocks.9/self_attn/Shape_output_0", "Shape1257", "Rank1259", "BinaryOp1261", "Unsqueeze1262", "BinaryOp1264", "Unsqueeze1265", "StridedSlice1268", "Squeeze1269", "BinaryOp1271", "/blocks.9/self_attn/Gather_output_0", "/blocks.9/self_attn/Unsqueeze_output_0", "Unsqueeze1279", "Unsqueeze1282", "StridedSlice1285", "Squeeze1286", "BinaryOp1287", "BinaryOp1288", "/blocks.9/self_attn/Gather_1_output_0", "/blocks.9/self_attn/Unsqueeze_1_output_0", "/blocks.9/self_attn/Concat_output_0", "/blocks.9/self_attn/Reshape_output_0", "/blocks.9/self_attn/Mul_output_0", "/blocks.9/self_attn/Shape_2_output_0", "Shape1295", "Rank1297", "BinaryOp1299", "Unsqueeze1300", "BinaryOp1302", "Unsqueeze1303", "StridedSlice1306", "Squeeze1307", "BinaryOp1308", "BinaryOp1309", "/blocks.9/self_attn/Gather_2_output_0", "/blocks.9/self_attn/Div_output_0", "/blocks.9/self_attn/Unsqueeze_7_output_0", "/blocks.9/self_attn/Slice_1_output_0", "/blocks.9/self_attn/Neg_output_0", "/blocks.9/self_attn/Unsqueeze_6_output_0", "/blocks.9/self_attn/Slice_output_0", "/blocks.9/self_attn/Concat_3_output_0", "/blocks.9/self_attn/Mul_1_output_0", "/blocks.9/self_attn/Add_output_0", "/blocks.9/self_attn/k_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_2_output_0", "/blocks.9/self_attn/Unsqueeze_3_output_0", "/blocks.9/self_attn/Concat_1_output_0", "/blocks.9/self_attn/Reshape_1_output_0", "/blocks.9/self_attn/Mul_2_output_0", "/blocks.9/self_attn/Shape_3_output_0", "Shape1328", "Rank1330", "BinaryOp1332", "Unsqueeze1333", "BinaryOp1335", "Unsqueeze1336", "StridedSlice1339", "Squeeze1340", "BinaryOp1341", "BinaryOp1342", "/blocks.9/self_attn/Gather_3_output_0", "/blocks.9/self_attn/Div_1_output_0", "/blocks.9/self_attn/Unsqueeze_9_output_0", "/blocks.9/self_attn/Slice_3_output_0", "/blocks.9/self_attn/Neg_1_output_0", "/blocks.9/self_attn/Unsqueeze_8_output_0", "/blocks.9/self_attn/Slice_2_output_0", "/blocks.9/self_attn/Concat_4_output_0", "/blocks.9/self_attn/Mul_3_output_0", "/blocks.9/self_attn/Add_1_output_0", "/blocks.9/self_attn/v_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_4_output_0", "/blocks.9/self_attn/Unsqueeze_5_output_0", "/blocks.9/self_attn/Concat_2_output_0", "/blocks.9/self_attn/Reshape_2_output_0", "/blocks.9/self_attn/fused_attn/FusedAttention_output_0", "/blocks.9/self_attn/o_proj/FakeLinear_output_0", "/blocks.9/Add_output_0", "/blocks.9/post_attention_layernorm/Mul_1_output_0", "/blocks.9/mlp/gate_proj/FakeLinear_output_0", "/blocks.9/mlp/act_fn/Mul_output_0", "/blocks.9/mlp/up_proj/FakeLinear_output_0", "/blocks.9/mlp/Mul_output_0", "/blocks.9/mlp/down_proj/FakeLinear_output_0", "/blocks.9/Add_1_output_0", "/blocks.10/Reshape_output_0", "/blocks.10/input_layernorm/Mul_1_output_0", "/blocks.10/self_attn/q_proj/FakeLinear_output_0", "/blocks.10/self_attn/Shape_output_0", "Shape1388", "Rank1390", "BinaryOp1392", "Unsqueeze1393", "BinaryOp1395", "Unsqueeze1396", "StridedSlice1399", "Squeeze1400", "BinaryOp1402", "/blocks.10/self_attn/Gather_output_0", "/blocks.10/self_attn/Unsqueeze_output_0", "Unsqueeze1410", "Unsqueeze1413", "StridedSlice1416", "Squeeze1417", "BinaryOp1418", "BinaryOp1419", "/blocks.10/self_attn/Gather_1_output_0", "/blocks.10/self_attn/Unsqueeze_1_output_0", "/blocks.10/self_attn/Concat_output_0", "/blocks.10/self_attn/Reshape_output_0", "/blocks.10/self_attn/Mul_output_0", "/blocks.10/self_attn/Shape_2_output_0", "Shape1426", "Rank1428", "BinaryOp1430", "Unsqueeze1431", "BinaryOp1433", "Unsqueeze1434", "StridedSlice1437", "Squeeze1438", "BinaryOp1439", "BinaryOp1440", "/blocks.10/self_attn/Gather_2_output_0", "/blocks.10/self_attn/Div_output_0", "/blocks.10/self_attn/Unsqueeze_7_output_0", "/blocks.10/self_attn/Slice_1_output_0", "/blocks.10/self_attn/Neg_output_0", "/blocks.10/self_attn/Unsqueeze_6_output_0", "/blocks.10/self_attn/Slice_output_0", "/blocks.10/self_attn/Concat_3_output_0", "/blocks.10/self_attn/Mul_1_output_0", "/blocks.10/self_attn/Add_output_0", "/blocks.10/self_attn/k_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_2_output_0", "/blocks.10/self_attn/Unsqueeze_3_output_0", "/blocks.10/self_attn/Concat_1_output_0", "/blocks.10/self_attn/Reshape_1_output_0", "/blocks.10/self_attn/Mul_2_output_0", "/blocks.10/self_attn/Shape_3_output_0", "Shape1459", "Rank1461", "BinaryOp1463", "Unsqueeze1464", "BinaryOp1466", "Unsqueeze1467", "StridedSlice1470", "Squeeze1471", "BinaryOp1472", "BinaryOp1473", "/blocks.10/self_attn/Gather_3_output_0", "/blocks.10/self_attn/Div_1_output_0", "/blocks.10/self_attn/Unsqueeze_9_output_0", "/blocks.10/self_attn/Slice_3_output_0", "/blocks.10/self_attn/Neg_1_output_0", "/blocks.10/self_attn/Unsqueeze_8_output_0", "/blocks.10/self_attn/Slice_2_output_0", "/blocks.10/self_attn/Concat_4_output_0", "/blocks.10/self_attn/Mul_3_output_0", "/blocks.10/self_attn/Add_1_output_0", "/blocks.10/self_attn/v_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_4_output_0", "/blocks.10/self_attn/Unsqueeze_5_output_0", "/blocks.10/self_attn/Concat_2_output_0", "/blocks.10/self_attn/Reshape_2_output_0", "/blocks.10/self_attn/fused_attn/FusedAttention_output_0", "/blocks.10/self_attn/o_proj/FakeLinear_output_0", "/blocks.10/Add_output_0", "/blocks.10/post_attention_layernorm/Mul_1_output_0", "/blocks.10/mlp/gate_proj/FakeLinear_output_0", "/blocks.10/mlp/act_fn/Mul_output_0", "/blocks.10/mlp/up_proj/FakeLinear_output_0", "/blocks.10/mlp/Mul_output_0", "/blocks.10/mlp/down_proj/FakeLinear_output_0", "/blocks.10/Add_1_output_0", "/blocks.11/Reshape_output_0", "/blocks.11/input_layernorm/Mul_1_output_0", "/blocks.11/self_attn/q_proj/FakeLinear_output_0", "/blocks.11/self_attn/Shape_output_0", "Shape1519", "Rank1521", "BinaryOp1523", "Unsqueeze1524", "BinaryOp1526", "Unsqueeze1527", "StridedSlice1530", "Squeeze1531", "BinaryOp1533", "/blocks.11/self_attn/Gather_output_0", "/blocks.11/self_attn/Unsqueeze_output_0", "Unsqueeze1541", "Unsqueeze1544", "StridedSlice1547", "Squeeze1548", "BinaryOp1549", "BinaryOp1550", "/blocks.11/self_attn/Gather_1_output_0", "/blocks.11/self_attn/Unsqueeze_1_output_0", "/blocks.11/self_attn/Concat_output_0", "/blocks.11/self_attn/Reshape_output_0", "/blocks.11/self_attn/Mul_output_0", "/blocks.11/self_attn/Shape_2_output_0", "Shape1557", "Rank1559", "BinaryOp1561", "Unsqueeze1562", "BinaryOp1564", "Unsqueeze1565", "StridedSlice1568", "Squeeze1569", "BinaryOp1570", "BinaryOp1571", "/blocks.11/self_attn/Gather_2_output_0", "/blocks.11/self_attn/Div_output_0", "/blocks.11/self_attn/Unsqueeze_7_output_0", "/blocks.11/self_attn/Slice_1_output_0", "/blocks.11/self_attn/Neg_output_0", "/blocks.11/self_attn/Unsqueeze_6_output_0", "/blocks.11/self_attn/Slice_output_0", "/blocks.11/self_attn/Concat_3_output_0", "/blocks.11/self_attn/Mul_1_output_0", "/blocks.11/self_attn/Add_output_0", "/blocks.11/self_attn/k_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_2_output_0", "/blocks.11/self_attn/Unsqueeze_3_output_0", "/blocks.11/self_attn/Concat_1_output_0", "/blocks.11/self_attn/Reshape_1_output_0", "/blocks.11/self_attn/Mul_2_output_0", "/blocks.11/self_attn/Shape_3_output_0", "Shape1590", "Rank1592", "BinaryOp1594", "Unsqueeze1595", "BinaryOp1597", "Unsqueeze1598", "StridedSlice1601", "Squeeze1602", "BinaryOp1603", "BinaryOp1604", "/blocks.11/self_attn/Gather_3_output_0", "/blocks.11/self_attn/Div_1_output_0", "/blocks.11/self_attn/Unsqueeze_9_output_0", "/blocks.11/self_attn/Slice_3_output_0", "/blocks.11/self_attn/Neg_1_output_0", "/blocks.11/self_attn/Unsqueeze_8_output_0", "/blocks.11/self_attn/Slice_2_output_0", "/blocks.11/self_attn/Concat_4_output_0", "/blocks.11/self_attn/Mul_3_output_0", "/blocks.11/self_attn/Add_1_output_0", "/blocks.11/self_attn/v_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_4_output_0", "/blocks.11/self_attn/Unsqueeze_5_output_0", "/blocks.11/self_attn/Concat_2_output_0", "/blocks.11/self_attn/Reshape_2_output_0", "/blocks.11/self_attn/fused_attn/FusedAttention_output_0", "/blocks.11/self_attn/o_proj/FakeLinear_output_0", "/blocks.11/Add_output_0", "/blocks.11/post_attention_layernorm/Mul_1_output_0", "/blocks.11/mlp/gate_proj/FakeLinear_output_0", "/blocks.11/mlp/act_fn/Mul_output_0", "/blocks.11/mlp/up_proj/FakeLinear_output_0", "/blocks.11/mlp/Mul_output_0", "/blocks.11/mlp/down_proj/FakeLinear_output_0", "/blocks.11/Add_1_output_0", "/blocks.12/Reshape_output_0", "/blocks.12/input_layernorm/Mul_1_output_0", "/blocks.12/self_attn/q_proj/FakeLinear_output_0", "/blocks.12/self_attn/Shape_output_0", "Shape1650", "Rank1652", "BinaryOp1654", "Unsqueeze1655", "BinaryOp1657", "Unsqueeze1658", "StridedSlice1661", "Squeeze1662", "BinaryOp1664", "/blocks.12/self_attn/Gather_output_0", "/blocks.12/self_attn/Unsqueeze_output_0", "Unsqueeze1672", "Unsqueeze1675", "StridedSlice1678", "Squeeze1679", "BinaryOp1680", "BinaryOp1681", "/blocks.12/self_attn/Gather_1_output_0", "/blocks.12/self_attn/Unsqueeze_1_output_0", "/blocks.12/self_attn/Concat_output_0", "/blocks.12/self_attn/Reshape_output_0", "/blocks.12/self_attn/Mul_output_0", "/blocks.12/self_attn/Shape_2_output_0", "Shape1688", "Rank1690", "BinaryOp1692", "Unsqueeze1693", "BinaryOp1695", "Unsqueeze1696", "StridedSlice1699", "Squeeze1700", "BinaryOp1701", "BinaryOp1702", "/blocks.12/self_attn/Gather_2_output_0", "/blocks.12/self_attn/Div_output_0", "/blocks.12/self_attn/Unsqueeze_7_output_0", "/blocks.12/self_attn/Slice_1_output_0", "/blocks.12/self_attn/Neg_output_0", "/blocks.12/self_attn/Unsqueeze_6_output_0", "/blocks.12/self_attn/Slice_output_0", "/blocks.12/self_attn/Concat_3_output_0", "/blocks.12/self_attn/Mul_1_output_0", "/blocks.12/self_attn/Add_output_0", "/blocks.12/self_attn/k_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_2_output_0", "/blocks.12/self_attn/Unsqueeze_3_output_0", "/blocks.12/self_attn/Concat_1_output_0", "/blocks.12/self_attn/Reshape_1_output_0", "/blocks.12/self_attn/Mul_2_output_0", "/blocks.12/self_attn/Shape_3_output_0", "Shape1721", "Rank1723", "BinaryOp1725", "Unsqueeze1726", "BinaryOp1728", "Unsqueeze1729", "StridedSlice1732", "Squeeze1733", "BinaryOp1734", "BinaryOp1735", "/blocks.12/self_attn/Gather_3_output_0", "/blocks.12/self_attn/Div_1_output_0", "/blocks.12/self_attn/Unsqueeze_9_output_0", "/blocks.12/self_attn/Slice_3_output_0", "/blocks.12/self_attn/Neg_1_output_0", "/blocks.12/self_attn/Unsqueeze_8_output_0", "/blocks.12/self_attn/Slice_2_output_0", "/blocks.12/self_attn/Concat_4_output_0", "/blocks.12/self_attn/Mul_3_output_0", "/blocks.12/self_attn/Add_1_output_0", "/blocks.12/self_attn/v_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_4_output_0", "/blocks.12/self_attn/Unsqueeze_5_output_0", "/blocks.12/self_attn/Concat_2_output_0", "/blocks.12/self_attn/Reshape_2_output_0", "/blocks.12/self_attn/fused_attn/FusedAttention_output_0", "/blocks.12/self_attn/o_proj/FakeLinear_output_0", "/blocks.12/Add_output_0", "/blocks.12/post_attention_layernorm/Mul_1_output_0", "/blocks.12/mlp/gate_proj/FakeLinear_output_0", "/blocks.12/mlp/act_fn/Mul_output_0", "/blocks.12/mlp/up_proj/FakeLinear_output_0", "/blocks.12/mlp/Mul_output_0", "/blocks.12/mlp/down_proj/FakeLinear_output_0", "/blocks.12/Add_1_output_0", "/blocks.13/Reshape_output_0", "/blocks.13/input_layernorm/Mul_1_output_0", "/blocks.13/self_attn/q_proj/FakeLinear_output_0", "/blocks.13/self_attn/Shape_output_0", "Shape1781", "Rank1783", "BinaryOp1785", "Unsqueeze1786", "BinaryOp1788", "Unsqueeze1789", "StridedSlice1792", "Squeeze1793", "BinaryOp1795", "/blocks.13/self_attn/Gather_output_0", "/blocks.13/self_attn/Unsqueeze_output_0", "Unsqueeze1803", "Unsqueeze1806", "StridedSlice1809", "Squeeze1810", "BinaryOp1811", "BinaryOp1812", "/blocks.13/self_attn/Gather_1_output_0", "/blocks.13/self_attn/Unsqueeze_1_output_0", "/blocks.13/self_attn/Concat_output_0", "/blocks.13/self_attn/Reshape_output_0", "/blocks.13/self_attn/Mul_output_0", "/blocks.13/self_attn/Shape_2_output_0", "Shape1819", "Rank1821", "BinaryOp1823", "Unsqueeze1824", "BinaryOp1826", "Unsqueeze1827", "StridedSlice1830", "Squeeze1831", "BinaryOp1832", "BinaryOp1833", "/blocks.13/self_attn/Gather_2_output_0", "/blocks.13/self_attn/Div_output_0", "/blocks.13/self_attn/Unsqueeze_7_output_0", "/blocks.13/self_attn/Slice_1_output_0", "/blocks.13/self_attn/Neg_output_0", "/blocks.13/self_attn/Unsqueeze_6_output_0", "/blocks.13/self_attn/Slice_output_0", "/blocks.13/self_attn/Concat_3_output_0", "/blocks.13/self_attn/Mul_1_output_0", "/blocks.13/self_attn/Add_output_0", "/blocks.13/self_attn/k_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_2_output_0", "/blocks.13/self_attn/Unsqueeze_3_output_0", "/blocks.13/self_attn/Concat_1_output_0", "/blocks.13/self_attn/Reshape_1_output_0", "/blocks.13/self_attn/Mul_2_output_0", "/blocks.13/self_attn/Shape_3_output_0", "Shape1852", "Rank1854", "BinaryOp1856", "Unsqueeze1857", "BinaryOp1859", "Unsqueeze1860", "StridedSlice1863", "Squeeze1864", "BinaryOp1865", "BinaryOp1866", "/blocks.13/self_attn/Gather_3_output_0", "/blocks.13/self_attn/Div_1_output_0", "/blocks.13/self_attn/Unsqueeze_9_output_0", "/blocks.13/self_attn/Slice_3_output_0", "/blocks.13/self_attn/Neg_1_output_0", "/blocks.13/self_attn/Unsqueeze_8_output_0", "/blocks.13/self_attn/Slice_2_output_0", "/blocks.13/self_attn/Concat_4_output_0", "/blocks.13/self_attn/Mul_3_output_0", "/blocks.13/self_attn/Add_1_output_0", "/blocks.13/self_attn/v_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_4_output_0", "/blocks.13/self_attn/Unsqueeze_5_output_0", "/blocks.13/self_attn/Concat_2_output_0", "/blocks.13/self_attn/Reshape_2_output_0", "/blocks.13/self_attn/fused_attn/FusedAttention_output_0", "/blocks.13/self_attn/o_proj/FakeLinear_output_0", "/blocks.13/Add_output_0", "/blocks.13/post_attention_layernorm/Mul_1_output_0", "/blocks.13/mlp/gate_proj/FakeLinear_output_0", "/blocks.13/mlp/act_fn/Mul_output_0", "/blocks.13/mlp/up_proj/FakeLinear_output_0", "/blocks.13/mlp/Mul_output_0", "/blocks.13/mlp/down_proj/FakeLinear_output_0", "/blocks.13/Add_1_output_0", "/blocks.14/Reshape_output_0", "/blocks.14/input_layernorm/Mul_1_output_0", "/blocks.14/self_attn/q_proj/FakeLinear_output_0", "/blocks.14/self_attn/Shape_output_0", "Shape1912", "Rank1914", "BinaryOp1916", "Unsqueeze1917", "BinaryOp1919", "Unsqueeze1920", "StridedSlice1923", "Squeeze1924", "BinaryOp1926", "/blocks.14/self_attn/Gather_output_0", "/blocks.14/self_attn/Unsqueeze_output_0", "Unsqueeze1934", "Unsqueeze1937", "StridedSlice1940", "Squeeze1941", "BinaryOp1942", "BinaryOp1943", "/blocks.14/self_attn/Gather_1_output_0", "/blocks.14/self_attn/Unsqueeze_1_output_0", "/blocks.14/self_attn/Concat_output_0", "/blocks.14/self_attn/Reshape_output_0", "/blocks.14/self_attn/Mul_output_0", "/blocks.14/self_attn/Shape_2_output_0", "Shape1950", "Rank1952", "BinaryOp1954", "Unsqueeze1955", "BinaryOp1957", "Unsqueeze1958", "StridedSlice1961", "Squeeze1962", "BinaryOp1963", "BinaryOp1964", "/blocks.14/self_attn/Gather_2_output_0", "/blocks.14/self_attn/Div_output_0", "/blocks.14/self_attn/Unsqueeze_7_output_0", "/blocks.14/self_attn/Slice_1_output_0", "/blocks.14/self_attn/Neg_output_0", "/blocks.14/self_attn/Unsqueeze_6_output_0", "/blocks.14/self_attn/Slice_output_0", "/blocks.14/self_attn/Concat_3_output_0", "/blocks.14/self_attn/Mul_1_output_0", "/blocks.14/self_attn/Add_output_0", "/blocks.14/self_attn/k_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_2_output_0", "/blocks.14/self_attn/Unsqueeze_3_output_0", "/blocks.14/self_attn/Concat_1_output_0", "/blocks.14/self_attn/Reshape_1_output_0", "/blocks.14/self_attn/Mul_2_output_0", "/blocks.14/self_attn/Shape_3_output_0", "Shape1983", "Rank1985", "BinaryOp1987", "Unsqueeze1988", "BinaryOp1990", "Unsqueeze1991", "StridedSlice1994", "Squeeze1995", "BinaryOp1996", "BinaryOp1997", "/blocks.14/self_attn/Gather_3_output_0", "/blocks.14/self_attn/Div_1_output_0", "/blocks.14/self_attn/Unsqueeze_9_output_0", "/blocks.14/self_attn/Slice_3_output_0", "/blocks.14/self_attn/Neg_1_output_0", "/blocks.14/self_attn/Unsqueeze_8_output_0", "/blocks.14/self_attn/Slice_2_output_0", "/blocks.14/self_attn/Concat_4_output_0", "/blocks.14/self_attn/Mul_3_output_0", "/blocks.14/self_attn/Add_1_output_0", "/blocks.14/self_attn/v_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_4_output_0", "/blocks.14/self_attn/Unsqueeze_5_output_0", "/blocks.14/self_attn/Concat_2_output_0", "/blocks.14/self_attn/Reshape_2_output_0", "/blocks.14/self_attn/fused_attn/FusedAttention_output_0", "/blocks.14/self_attn/o_proj/FakeLinear_output_0", "/blocks.14/Add_output_0", "/blocks.14/post_attention_layernorm/Mul_1_output_0", "/blocks.14/mlp/gate_proj/FakeLinear_output_0", "/blocks.14/mlp/act_fn/Mul_output_0", "/blocks.14/mlp/up_proj/FakeLinear_output_0", "/blocks.14/mlp/Mul_output_0", "/blocks.14/mlp/down_proj/FakeLinear_output_0", "/blocks.14/Add_1_output_0", "/blocks.15/Reshape_output_0", "/blocks.15/input_layernorm/Mul_1_output_0", "/blocks.15/self_attn/q_proj/FakeLinear_output_0", "/blocks.15/self_attn/Shape_output_0", "Shape2043", "Rank2045", "BinaryOp2047", "Unsqueeze2048", "BinaryOp2050", "Unsqueeze2051", "StridedSlice2054", "Squeeze2055", "BinaryOp2057", "/blocks.15/self_attn/Gather_output_0", "/blocks.15/self_attn/Unsqueeze_output_0", "Unsqueeze2065", "Unsqueeze2068", "StridedSlice2071", "Squeeze2072", "BinaryOp2073", "BinaryOp2074", "/blocks.15/self_attn/Gather_1_output_0", "/blocks.15/self_attn/Unsqueeze_1_output_0", "/blocks.15/self_attn/Concat_output_0", "/blocks.15/self_attn/Reshape_output_0", "/blocks.15/self_attn/Mul_output_0", "/blocks.15/self_attn/Shape_2_output_0", "Shape2081", "Rank2083", "BinaryOp2085", "Unsqueeze2086", "BinaryOp2088", "Unsqueeze2089", "StridedSlice2092", "Squeeze2093", "BinaryOp2094", "BinaryOp2095", "/blocks.15/self_attn/Gather_2_output_0", "/blocks.15/self_attn/Div_output_0", "/blocks.15/self_attn/Unsqueeze_7_output_0", "/blocks.15/self_attn/Slice_1_output_0", "/blocks.15/self_attn/Neg_output_0", "/blocks.15/self_attn/Unsqueeze_6_output_0", "/blocks.15/self_attn/Slice_output_0", "/blocks.15/self_attn/Concat_3_output_0", "/blocks.15/self_attn/Mul_1_output_0", "/blocks.15/self_attn/Add_output_0", "/blocks.15/self_attn/k_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_2_output_0", "/blocks.15/self_attn/Unsqueeze_3_output_0", "/blocks.15/self_attn/Concat_1_output_0", "/blocks.15/self_attn/Reshape_1_output_0", "/blocks.15/self_attn/Mul_2_output_0", "/blocks.15/self_attn/Shape_3_output_0", "Shape2114", "Rank2116", "BinaryOp2118", "Unsqueeze2119", "BinaryOp2121", "Unsqueeze2122", "StridedSlice2125", "Squeeze2126", "BinaryOp2127", "BinaryOp2128", "/blocks.15/self_attn/Gather_3_output_0", "/blocks.15/self_attn/Div_1_output_0", "/blocks.15/self_attn/Unsqueeze_9_output_0", "/blocks.15/self_attn/Slice_3_output_0", "/blocks.15/self_attn/Neg_1_output_0", "/blocks.15/self_attn/Unsqueeze_8_output_0", "/blocks.15/self_attn/Slice_2_output_0", "/blocks.15/self_attn/Concat_4_output_0", "/blocks.15/self_attn/Mul_3_output_0", "/blocks.15/self_attn/Add_1_output_0", "/blocks.15/self_attn/v_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_4_output_0", "/blocks.15/self_attn/Unsqueeze_5_output_0", "/blocks.15/self_attn/Concat_2_output_0", "/blocks.15/self_attn/Reshape_2_output_0", "/blocks.15/self_attn/fused_attn/FusedAttention_output_0", "/blocks.15/self_attn/o_proj/FakeLinear_output_0", "/blocks.15/Add_output_0", "/blocks.15/post_attention_layernorm/Mul_1_output_0", "/blocks.15/mlp/gate_proj/FakeLinear_output_0", "/blocks.15/mlp/act_fn/Mul_output_0", "/blocks.15/mlp/up_proj/FakeLinear_output_0", "/blocks.15/mlp/Mul_output_0", "/blocks.15/mlp/down_proj/FakeLinear_output_0", "/blocks.15/Add_1_output_0", "/blocks.16/Reshape_output_0", "/blocks.16/input_layernorm/Mul_1_output_0", "/blocks.16/self_attn/q_proj/FakeLinear_output_0", "/blocks.16/self_attn/Shape_output_0", "Shape2174", "Rank2176", "BinaryOp2178", "Unsqueeze2179", "BinaryOp2181", "Unsqueeze2182", "StridedSlice2185", "Squeeze2186", "BinaryOp2188", "/blocks.16/self_attn/Gather_output_0", "/blocks.16/self_attn/Unsqueeze_output_0", "Unsqueeze2196", "Unsqueeze2199", "StridedSlice2202", "Squeeze2203", "BinaryOp2204", "BinaryOp2205", "/blocks.16/self_attn/Gather_1_output_0", "/blocks.16/self_attn/Unsqueeze_1_output_0", "/blocks.16/self_attn/Concat_output_0", "/blocks.16/self_attn/Reshape_output_0", "/blocks.16/self_attn/Mul_output_0", "/blocks.16/self_attn/Shape_2_output_0", "Shape2212", "Rank2214", "BinaryOp2216", "Unsqueeze2217", "BinaryOp2219", "Unsqueeze2220", "StridedSlice2223", "Squeeze2224", "BinaryOp2225", "BinaryOp2226", "/blocks.16/self_attn/Gather_2_output_0", "/blocks.16/self_attn/Div_output_0", "/blocks.16/self_attn/Unsqueeze_7_output_0", "/blocks.16/self_attn/Slice_1_output_0", "/blocks.16/self_attn/Neg_output_0", "/blocks.16/self_attn/Unsqueeze_6_output_0", "/blocks.16/self_attn/Slice_output_0", "/blocks.16/self_attn/Concat_3_output_0", "/blocks.16/self_attn/Mul_1_output_0", "/blocks.16/self_attn/Add_output_0", "/blocks.16/self_attn/k_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_2_output_0", "/blocks.16/self_attn/Unsqueeze_3_output_0", "/blocks.16/self_attn/Concat_1_output_0", "/blocks.16/self_attn/Reshape_1_output_0", "/blocks.16/self_attn/Mul_2_output_0", "/blocks.16/self_attn/Shape_3_output_0", "Shape2245", "Rank2247", "BinaryOp2249", "Unsqueeze2250", "BinaryOp2252", "Unsqueeze2253", "StridedSlice2256", "Squeeze2257", "BinaryOp2258", "BinaryOp2259", "/blocks.16/self_attn/Gather_3_output_0", "/blocks.16/self_attn/Div_1_output_0", "/blocks.16/self_attn/Unsqueeze_9_output_0", "/blocks.16/self_attn/Slice_3_output_0", "/blocks.16/self_attn/Neg_1_output_0", "/blocks.16/self_attn/Unsqueeze_8_output_0", "/blocks.16/self_attn/Slice_2_output_0", "/blocks.16/self_attn/Concat_4_output_0", "/blocks.16/self_attn/Mul_3_output_0", "/blocks.16/self_attn/Add_1_output_0", "/blocks.16/self_attn/v_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_4_output_0", "/blocks.16/self_attn/Unsqueeze_5_output_0", "/blocks.16/self_attn/Concat_2_output_0", "/blocks.16/self_attn/Reshape_2_output_0", "/blocks.16/self_attn/fused_attn/FusedAttention_output_0", "/blocks.16/self_attn/o_proj/FakeLinear_output_0", "/blocks.16/Add_output_0", "/blocks.16/post_attention_layernorm/Mul_1_output_0", "/blocks.16/mlp/gate_proj/FakeLinear_output_0", "/blocks.16/mlp/act_fn/Mul_output_0", "/blocks.16/mlp/up_proj/FakeLinear_output_0", "/blocks.16/mlp/Mul_output_0", "/blocks.16/mlp/down_proj/FakeLinear_output_0", "/blocks.16/Add_1_output_0", "/blocks.17/Reshape_output_0", "/blocks.17/input_layernorm/Mul_1_output_0", "/blocks.17/self_attn/q_proj/FakeLinear_output_0", "/blocks.17/self_attn/Shape_output_0", "Shape2305", "Rank2307", "BinaryOp2309", "Unsqueeze2310", "BinaryOp2312", "Unsqueeze2313", "StridedSlice2316", "Squeeze2317", "BinaryOp2319", "/blocks.17/self_attn/Gather_output_0", "/blocks.17/self_attn/Unsqueeze_output_0", "Unsqueeze2327", "Unsqueeze2330", "StridedSlice2333", "Squeeze2334", "BinaryOp2335", "BinaryOp2336", "/blocks.17/self_attn/Gather_1_output_0", "/blocks.17/self_attn/Unsqueeze_1_output_0", "/blocks.17/self_attn/Concat_output_0", "/blocks.17/self_attn/Reshape_output_0", "/blocks.17/self_attn/Mul_output_0", "/blocks.17/self_attn/Shape_2_output_0", "Shape2343", "Rank2345", "BinaryOp2347", "Unsqueeze2348", "BinaryOp2350", "Unsqueeze2351", "StridedSlice2354", "Squeeze2355", "BinaryOp2356", "BinaryOp2357", "/blocks.17/self_attn/Gather_2_output_0", "/blocks.17/self_attn/Div_output_0", "/blocks.17/self_attn/Unsqueeze_7_output_0", "/blocks.17/self_attn/Slice_1_output_0", "/blocks.17/self_attn/Neg_output_0", "/blocks.17/self_attn/Unsqueeze_6_output_0", "/blocks.17/self_attn/Slice_output_0", "/blocks.17/self_attn/Concat_3_output_0", "/blocks.17/self_attn/Mul_1_output_0", "/blocks.17/self_attn/Add_output_0", "/blocks.17/self_attn/k_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_2_output_0", "/blocks.17/self_attn/Unsqueeze_3_output_0", "/blocks.17/self_attn/Concat_1_output_0", "/blocks.17/self_attn/Reshape_1_output_0", "/blocks.17/self_attn/Mul_2_output_0", "/blocks.17/self_attn/Shape_3_output_0", "Shape2376", "Rank2378", "BinaryOp2380", "Unsqueeze2381", "BinaryOp2383", "Unsqueeze2384", "StridedSlice2387", "Squeeze2388", "BinaryOp2389", "BinaryOp2390", "/blocks.17/self_attn/Gather_3_output_0", "/blocks.17/self_attn/Div_1_output_0", "/blocks.17/self_attn/Unsqueeze_9_output_0", "/blocks.17/self_attn/Slice_3_output_0", "/blocks.17/self_attn/Neg_1_output_0", "/blocks.17/self_attn/Unsqueeze_8_output_0", "/blocks.17/self_attn/Slice_2_output_0", "/blocks.17/self_attn/Concat_4_output_0", "/blocks.17/self_attn/Mul_3_output_0", "/blocks.17/self_attn/Add_1_output_0", "/blocks.17/self_attn/v_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_4_output_0", "/blocks.17/self_attn/Unsqueeze_5_output_0", "/blocks.17/self_attn/Concat_2_output_0", "/blocks.17/self_attn/Reshape_2_output_0", "/blocks.17/self_attn/fused_attn/FusedAttention_output_0", "/blocks.17/self_attn/o_proj/FakeLinear_output_0", "/blocks.17/Add_output_0", "/blocks.17/post_attention_layernorm/Mul_1_output_0", "/blocks.17/mlp/gate_proj/FakeLinear_output_0", "/blocks.17/mlp/act_fn/Mul_output_0", "/blocks.17/mlp/up_proj/FakeLinear_output_0", "/blocks.17/mlp/Mul_output_0", "/blocks.17/mlp/down_proj/FakeLinear_output_0", "/blocks.17/Add_1_output_0", "/blocks.18/Reshape_output_0", "/blocks.18/input_layernorm/Mul_1_output_0", "/blocks.18/self_attn/q_proj/FakeLinear_output_0", "/blocks.18/self_attn/Shape_output_0", "Shape2436", "Rank2438", "BinaryOp2440", "Unsqueeze2441", "BinaryOp2443", "Unsqueeze2444", "StridedSlice2447", "Squeeze2448", "BinaryOp2450", "/blocks.18/self_attn/Gather_output_0", "/blocks.18/self_attn/Unsqueeze_output_0", "Unsqueeze2458", "Unsqueeze2461", "StridedSlice2464", "Squeeze2465", "BinaryOp2466", "BinaryOp2467", "/blocks.18/self_attn/Gather_1_output_0", "/blocks.18/self_attn/Unsqueeze_1_output_0", "/blocks.18/self_attn/Concat_output_0", "/blocks.18/self_attn/Reshape_output_0", "/blocks.18/self_attn/Mul_output_0", "/blocks.18/self_attn/Shape_2_output_0", "Shape2474", "Rank2476", "BinaryOp2478", "Unsqueeze2479", "BinaryOp2481", "Unsqueeze2482", "StridedSlice2485", "Squeeze2486", "BinaryOp2487", "BinaryOp2488", "/blocks.18/self_attn/Gather_2_output_0", "/blocks.18/self_attn/Div_output_0", "/blocks.18/self_attn/Unsqueeze_7_output_0", "/blocks.18/self_attn/Slice_1_output_0", "/blocks.18/self_attn/Neg_output_0", "/blocks.18/self_attn/Unsqueeze_6_output_0", "/blocks.18/self_attn/Slice_output_0", "/blocks.18/self_attn/Concat_3_output_0", "/blocks.18/self_attn/Mul_1_output_0", "/blocks.18/self_attn/Add_output_0", "/blocks.18/self_attn/k_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_2_output_0", "/blocks.18/self_attn/Unsqueeze_3_output_0", "/blocks.18/self_attn/Concat_1_output_0", "/blocks.18/self_attn/Reshape_1_output_0", "/blocks.18/self_attn/Mul_2_output_0", "/blocks.18/self_attn/Shape_3_output_0", "Shape2507", "Rank2509", "BinaryOp2511", "Unsqueeze2512", "BinaryOp2514", "Unsqueeze2515", "StridedSlice2518", "Squeeze2519", "BinaryOp2520", "BinaryOp2521", "/blocks.18/self_attn/Gather_3_output_0", "/blocks.18/self_attn/Div_1_output_0", "/blocks.18/self_attn/Unsqueeze_9_output_0", "/blocks.18/self_attn/Slice_3_output_0", "/blocks.18/self_attn/Neg_1_output_0", "/blocks.18/self_attn/Unsqueeze_8_output_0", "/blocks.18/self_attn/Slice_2_output_0", "/blocks.18/self_attn/Concat_4_output_0", "/blocks.18/self_attn/Mul_3_output_0", "/blocks.18/self_attn/Add_1_output_0", "/blocks.18/self_attn/v_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_4_output_0", "/blocks.18/self_attn/Unsqueeze_5_output_0", "/blocks.18/self_attn/Concat_2_output_0", "/blocks.18/self_attn/Reshape_2_output_0", "/blocks.18/self_attn/fused_attn/FusedAttention_output_0", "/blocks.18/self_attn/o_proj/FakeLinear_output_0", "/blocks.18/Add_output_0", "/blocks.18/post_attention_layernorm/Mul_1_output_0", "/blocks.18/mlp/gate_proj/FakeLinear_output_0", "/blocks.18/mlp/act_fn/Mul_output_0", "/blocks.18/mlp/up_proj/FakeLinear_output_0", "/blocks.18/mlp/Mul_output_0", "/blocks.18/mlp/down_proj/FakeLinear_output_0", "/blocks.18/Add_1_output_0", "/blocks.19/Reshape_output_0", "/blocks.19/input_layernorm/Mul_1_output_0", "/blocks.19/self_attn/q_proj/FakeLinear_output_0", "/blocks.19/self_attn/Shape_output_0", "Shape2567", "Rank2569", "BinaryOp2571", "Unsqueeze2572", "BinaryOp2574", "Unsqueeze2575", "StridedSlice2578", "Squeeze2579", "BinaryOp2581", "/blocks.19/self_attn/Gather_output_0", "/blocks.19/self_attn/Unsqueeze_output_0", "Unsqueeze2589", "Unsqueeze2592", "StridedSlice2595", "Squeeze2596", "BinaryOp2597", "BinaryOp2598", "/blocks.19/self_attn/Gather_1_output_0", "/blocks.19/self_attn/Unsqueeze_1_output_0", "/blocks.19/self_attn/Concat_output_0", "/blocks.19/self_attn/Reshape_output_0", "/blocks.19/self_attn/Mul_output_0", "/blocks.19/self_attn/Shape_2_output_0", "Shape2605", "Rank2607", "BinaryOp2609", "Unsqueeze2610", "BinaryOp2612", "Unsqueeze2613", "StridedSlice2616", "Squeeze2617", "BinaryOp2618", "BinaryOp2619", "/blocks.19/self_attn/Gather_2_output_0", "/blocks.19/self_attn/Div_output_0", "/blocks.19/self_attn/Unsqueeze_7_output_0", "/blocks.19/self_attn/Slice_1_output_0", "/blocks.19/self_attn/Neg_output_0", "/blocks.19/self_attn/Unsqueeze_6_output_0", "/blocks.19/self_attn/Slice_output_0", "/blocks.19/self_attn/Concat_3_output_0", "/blocks.19/self_attn/Mul_1_output_0", "/blocks.19/self_attn/Add_output_0", "/blocks.19/self_attn/k_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_2_output_0", "/blocks.19/self_attn/Unsqueeze_3_output_0", "/blocks.19/self_attn/Concat_1_output_0", "/blocks.19/self_attn/Reshape_1_output_0", "/blocks.19/self_attn/Mul_2_output_0", "/blocks.19/self_attn/Shape_3_output_0", "Shape2638", "Rank2640", "BinaryOp2642", "Unsqueeze2643", "BinaryOp2645", "Unsqueeze2646", "StridedSlice2649", "Squeeze2650", "BinaryOp2651", "BinaryOp2652", "/blocks.19/self_attn/Gather_3_output_0", "/blocks.19/self_attn/Div_1_output_0", "/blocks.19/self_attn/Unsqueeze_9_output_0", "/blocks.19/self_attn/Slice_3_output_0", "/blocks.19/self_attn/Neg_1_output_0", "/blocks.19/self_attn/Unsqueeze_8_output_0", "/blocks.19/self_attn/Slice_2_output_0", "/blocks.19/self_attn/Concat_4_output_0", "/blocks.19/self_attn/Mul_3_output_0", "/blocks.19/self_attn/Add_1_output_0", "/blocks.19/self_attn/v_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_4_output_0", "/blocks.19/self_attn/Unsqueeze_5_output_0", "/blocks.19/self_attn/Concat_2_output_0", "/blocks.19/self_attn/Reshape_2_output_0", "/blocks.19/self_attn/fused_attn/FusedAttention_output_0", "/blocks.19/self_attn/o_proj/FakeLinear_output_0", "/blocks.19/Add_output_0", "/blocks.19/post_attention_layernorm/Mul_1_output_0", "/blocks.19/mlp/gate_proj/FakeLinear_output_0", "/blocks.19/mlp/act_fn/Mul_output_0", "/blocks.19/mlp/up_proj/FakeLinear_output_0", "/blocks.19/mlp/Mul_output_0", "/blocks.19/mlp/down_proj/FakeLinear_output_0", "/blocks.19/Add_1_output_0", "/blocks.20/Reshape_output_0", "/blocks.20/input_layernorm/Mul_1_output_0", "/blocks.20/self_attn/q_proj/FakeLinear_output_0", "/blocks.20/self_attn/Shape_output_0", "Shape2698", "Rank2700", "BinaryOp2702", "Unsqueeze2703", "BinaryOp2705", "Unsqueeze2706", "StridedSlice2709", "Squeeze2710", "BinaryOp2712", "/blocks.20/self_attn/Gather_output_0", "/blocks.20/self_attn/Unsqueeze_output_0", "Unsqueeze2720", "Unsqueeze2723", "StridedSlice2726", "Squeeze2727", "BinaryOp2728", "BinaryOp2729", "/blocks.20/self_attn/Gather_1_output_0", "/blocks.20/self_attn/Unsqueeze_1_output_0", "/blocks.20/self_attn/Concat_output_0", "/blocks.20/self_attn/Reshape_output_0", "/blocks.20/self_attn/Mul_output_0", "/blocks.20/self_attn/Shape_2_output_0", "Shape2736", "Rank2738", "BinaryOp2740", "Unsqueeze2741", "BinaryOp2743", "Unsqueeze2744", "StridedSlice2747", "Squeeze2748", "BinaryOp2749", "BinaryOp2750", "/blocks.20/self_attn/Gather_2_output_0", "/blocks.20/self_attn/Div_output_0", "/blocks.20/self_attn/Unsqueeze_7_output_0", "/blocks.20/self_attn/Slice_1_output_0", "/blocks.20/self_attn/Neg_output_0", "/blocks.20/self_attn/Unsqueeze_6_output_0", "/blocks.20/self_attn/Slice_output_0", "/blocks.20/self_attn/Concat_3_output_0", "/blocks.20/self_attn/Mul_1_output_0", "/blocks.20/self_attn/Add_output_0", "/blocks.20/self_attn/k_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_2_output_0", "/blocks.20/self_attn/Unsqueeze_3_output_0", "/blocks.20/self_attn/Concat_1_output_0", "/blocks.20/self_attn/Reshape_1_output_0", "/blocks.20/self_attn/Mul_2_output_0", "/blocks.20/self_attn/Shape_3_output_0", "Shape2769", "Rank2771", "BinaryOp2773", "Unsqueeze2774", "BinaryOp2776", "Unsqueeze2777", "StridedSlice2780", "Squeeze2781", "BinaryOp2782", "BinaryOp2783", "/blocks.20/self_attn/Gather_3_output_0", "/blocks.20/self_attn/Div_1_output_0", "/blocks.20/self_attn/Unsqueeze_9_output_0", "/blocks.20/self_attn/Slice_3_output_0", "/blocks.20/self_attn/Neg_1_output_0", "/blocks.20/self_attn/Unsqueeze_8_output_0", "/blocks.20/self_attn/Slice_2_output_0", "/blocks.20/self_attn/Concat_4_output_0", "/blocks.20/self_attn/Mul_3_output_0", "/blocks.20/self_attn/Add_1_output_0", "/blocks.20/self_attn/v_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_4_output_0", "/blocks.20/self_attn/Unsqueeze_5_output_0", "/blocks.20/self_attn/Concat_2_output_0", "/blocks.20/self_attn/Reshape_2_output_0", "/blocks.20/self_attn/fused_attn/FusedAttention_output_0", "/blocks.20/self_attn/o_proj/FakeLinear_output_0", "/blocks.20/Add_output_0", "/blocks.20/post_attention_layernorm/Mul_1_output_0", "/blocks.20/mlp/gate_proj/FakeLinear_output_0", "/blocks.20/mlp/act_fn/Mul_output_0", "/blocks.20/mlp/up_proj/FakeLinear_output_0", "/blocks.20/mlp/Mul_output_0", "/blocks.20/mlp/down_proj/FakeLinear_output_0", "/blocks.20/Add_1_output_0", "/blocks.21/Reshape_output_0", "/blocks.21/input_layernorm/Mul_1_output_0", "/blocks.21/self_attn/q_proj/FakeLinear_output_0", "/blocks.21/self_attn/Shape_output_0", "Shape2829", "Rank2831", "BinaryOp2833", "Unsqueeze2834", "BinaryOp2836", "Unsqueeze2837", "StridedSlice2840", "Squeeze2841", "BinaryOp2843", "/blocks.21/self_attn/Gather_output_0", "/blocks.21/self_attn/Unsqueeze_output_0", "Unsqueeze2851", "Unsqueeze2854", "StridedSlice2857", "Squeeze2858", "BinaryOp2859", "BinaryOp2860", "/blocks.21/self_attn/Gather_1_output_0", "/blocks.21/self_attn/Unsqueeze_1_output_0", "/blocks.21/self_attn/Concat_output_0", "/blocks.21/self_attn/Reshape_output_0", "/blocks.21/self_attn/Mul_output_0", "/blocks.21/self_attn/Shape_2_output_0", "Shape2867", "Rank2869", "BinaryOp2871", "Unsqueeze2872", "BinaryOp2874", "Unsqueeze2875", "StridedSlice2878", "Squeeze2879", "BinaryOp2880", "BinaryOp2881", "/blocks.21/self_attn/Gather_2_output_0", "/blocks.21/self_attn/Div_output_0", "/blocks.21/self_attn/Unsqueeze_7_output_0", "/blocks.21/self_attn/Slice_1_output_0", "/blocks.21/self_attn/Neg_output_0", "/blocks.21/self_attn/Unsqueeze_6_output_0", "/blocks.21/self_attn/Slice_output_0", "/blocks.21/self_attn/Concat_3_output_0", "/blocks.21/self_attn/Mul_1_output_0", "/blocks.21/self_attn/Add_output_0", "/blocks.21/self_attn/k_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_2_output_0", "/blocks.21/self_attn/Unsqueeze_3_output_0", "/blocks.21/self_attn/Concat_1_output_0", "/blocks.21/self_attn/Reshape_1_output_0", "/blocks.21/self_attn/Mul_2_output_0", "/blocks.21/self_attn/Shape_3_output_0", "Shape2900", "Rank2902", "BinaryOp2904", "Unsqueeze2905", "BinaryOp2907", "Unsqueeze2908", "StridedSlice2911", "Squeeze2912", "BinaryOp2913", "BinaryOp2914", "/blocks.21/self_attn/Gather_3_output_0", "/blocks.21/self_attn/Div_1_output_0", "/blocks.21/self_attn/Unsqueeze_9_output_0", "/blocks.21/self_attn/Slice_3_output_0", "/blocks.21/self_attn/Neg_1_output_0", "/blocks.21/self_attn/Unsqueeze_8_output_0", "/blocks.21/self_attn/Slice_2_output_0", "/blocks.21/self_attn/Concat_4_output_0", "/blocks.21/self_attn/Mul_3_output_0", "/blocks.21/self_attn/Add_1_output_0", "/blocks.21/self_attn/v_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_4_output_0", "/blocks.21/self_attn/Unsqueeze_5_output_0", "/blocks.21/self_attn/Concat_2_output_0", "/blocks.21/self_attn/Reshape_2_output_0", "/blocks.21/self_attn/fused_attn/FusedAttention_output_0", "/blocks.21/self_attn/o_proj/FakeLinear_output_0", "/blocks.21/Add_output_0", "/blocks.21/post_attention_layernorm/Mul_1_output_0", "/blocks.21/mlp/gate_proj/FakeLinear_output_0", "/blocks.21/mlp/act_fn/Mul_output_0", "/blocks.21/mlp/up_proj/FakeLinear_output_0", "/blocks.21/mlp/Mul_output_0", "/blocks.21/mlp/down_proj/FakeLinear_output_0", "/blocks.21/Add_1_output_0", "/blocks.22/Reshape_output_0", "/blocks.22/input_layernorm/Mul_1_output_0", "/blocks.22/self_attn/q_proj/FakeLinear_output_0", "/blocks.22/self_attn/Shape_output_0", "Shape2960", "Rank2962", "BinaryOp2964", "Unsqueeze2965", "BinaryOp2967", "Unsqueeze2968", "StridedSlice2971", "Squeeze2972", "BinaryOp2974", "/blocks.22/self_attn/Gather_output_0", "/blocks.22/self_attn/Unsqueeze_output_0", "Unsqueeze2982", "Unsqueeze2985", "StridedSlice2988", "Squeeze2989", "BinaryOp2990", "BinaryOp2991", "/blocks.22/self_attn/Gather_1_output_0", "/blocks.22/self_attn/Unsqueeze_1_output_0", "/blocks.22/self_attn/Concat_output_0", "/blocks.22/self_attn/Reshape_output_0", "/blocks.22/self_attn/Mul_output_0", "/blocks.22/self_attn/Shape_2_output_0", "Shape2998", "Rank3000", "BinaryOp3002", "Unsqueeze3003", "BinaryOp3005", "Unsqueeze3006", "StridedSlice3009", "Squeeze3010", "BinaryOp3011", "BinaryOp3012", "/blocks.22/self_attn/Gather_2_output_0", "/blocks.22/self_attn/Div_output_0", "/blocks.22/self_attn/Unsqueeze_7_output_0", "/blocks.22/self_attn/Slice_1_output_0", "/blocks.22/self_attn/Neg_output_0", "/blocks.22/self_attn/Unsqueeze_6_output_0", "/blocks.22/self_attn/Slice_output_0", "/blocks.22/self_attn/Concat_3_output_0", "/blocks.22/self_attn/Mul_1_output_0", "/blocks.22/self_attn/Add_output_0", "/blocks.22/self_attn/k_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_2_output_0", "/blocks.22/self_attn/Unsqueeze_3_output_0", "/blocks.22/self_attn/Concat_1_output_0", "/blocks.22/self_attn/Reshape_1_output_0", "/blocks.22/self_attn/Mul_2_output_0", "/blocks.22/self_attn/Shape_3_output_0", "Shape3031", "Rank3033", "BinaryOp3035", "Unsqueeze3036", "BinaryOp3038", "Unsqueeze3039", "StridedSlice3042", "Squeeze3043", "BinaryOp3044", "BinaryOp3045", "/blocks.22/self_attn/Gather_3_output_0", "/blocks.22/self_attn/Div_1_output_0", "/blocks.22/self_attn/Unsqueeze_9_output_0", "/blocks.22/self_attn/Slice_3_output_0", "/blocks.22/self_attn/Neg_1_output_0", "/blocks.22/self_attn/Unsqueeze_8_output_0", "/blocks.22/self_attn/Slice_2_output_0", "/blocks.22/self_attn/Concat_4_output_0", "/blocks.22/self_attn/Mul_3_output_0", "/blocks.22/self_attn/Add_1_output_0", "/blocks.22/self_attn/v_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_4_output_0", "/blocks.22/self_attn/Unsqueeze_5_output_0", "/blocks.22/self_attn/Concat_2_output_0", "/blocks.22/self_attn/Reshape_2_output_0", "/blocks.22/self_attn/fused_attn/FusedAttention_output_0", "/blocks.22/self_attn/o_proj/FakeLinear_output_0", "/blocks.22/Add_output_0", "/blocks.22/post_attention_layernorm/Mul_1_output_0", "/blocks.22/mlp/gate_proj/FakeLinear_output_0", "/blocks.22/mlp/act_fn/Mul_output_0", "/blocks.22/mlp/up_proj/FakeLinear_output_0", "/blocks.22/mlp/Mul_output_0", "/blocks.22/mlp/down_proj/FakeLinear_output_0", "/blocks.22/Add_1_output_0", "/blocks.23/Reshape_output_0", "/blocks.23/input_layernorm/Mul_1_output_0", "/blocks.23/self_attn/q_proj/FakeLinear_output_0", "/blocks.23/self_attn/Shape_output_0", "Shape3091", "Rank3093", "BinaryOp3095", "Unsqueeze3096", "BinaryOp3098", "Unsqueeze3099", "StridedSlice3102", "Squeeze3103", "BinaryOp3105", "/blocks.23/self_attn/Gather_output_0", "/blocks.23/self_attn/Unsqueeze_output_0", "Unsqueeze3113", "Unsqueeze3116", "StridedSlice3119", "Squeeze3120", "BinaryOp3121", "BinaryOp3122", "/blocks.23/self_attn/Gather_1_output_0", "/blocks.23/self_attn/Unsqueeze_1_output_0", "/blocks.23/self_attn/Concat_output_0", "/blocks.23/self_attn/Reshape_output_0", "/blocks.23/self_attn/Mul_output_0", "/blocks.23/self_attn/Shape_2_output_0", "Shape3129", "Rank3131", "BinaryOp3133", "Unsqueeze3134", "BinaryOp3136", "Unsqueeze3137", "StridedSlice3140", "Squeeze3141", "BinaryOp3142", "BinaryOp3143", "/blocks.23/self_attn/Gather_2_output_0", "/blocks.23/self_attn/Div_output_0", "/blocks.23/self_attn/Unsqueeze_7_output_0", "/blocks.23/self_attn/Slice_1_output_0", "/blocks.23/self_attn/Neg_output_0", "/blocks.23/self_attn/Unsqueeze_6_output_0", "/blocks.23/self_attn/Slice_output_0", "/blocks.23/self_attn/Concat_3_output_0", "/blocks.23/self_attn/Mul_1_output_0", "/blocks.23/self_attn/Add_output_0", "/blocks.23/self_attn/k_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_2_output_0", "/blocks.23/self_attn/Unsqueeze_3_output_0", "/blocks.23/self_attn/Concat_1_output_0", "/blocks.23/self_attn/Reshape_1_output_0", "/blocks.23/self_attn/Mul_2_output_0", "/blocks.23/self_attn/Shape_3_output_0", "Shape3162", "Rank3164", "BinaryOp3166", "Unsqueeze3167", "BinaryOp3169", "Unsqueeze3170", "StridedSlice3173", "Squeeze3174", "BinaryOp3175", "BinaryOp3176", "/blocks.23/self_attn/Gather_3_output_0", "/blocks.23/self_attn/Div_1_output_0", "/blocks.23/self_attn/Unsqueeze_9_output_0", "/blocks.23/self_attn/Slice_3_output_0", "/blocks.23/self_attn/Neg_1_output_0", "/blocks.23/self_attn/Unsqueeze_8_output_0", "/blocks.23/self_attn/Slice_2_output_0", "/blocks.23/self_attn/Concat_4_output_0", "/blocks.23/self_attn/Mul_3_output_0", "/blocks.23/self_attn/Add_1_output_0", "/blocks.23/self_attn/v_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_4_output_0", "/blocks.23/self_attn/Unsqueeze_5_output_0", "/blocks.23/self_attn/Concat_2_output_0", "/blocks.23/self_attn/Reshape_2_output_0", "/blocks.23/self_attn/fused_attn/FusedAttention_output_0", "/blocks.23/self_attn/o_proj/FakeLinear_output_0", "/blocks.23/Add_output_0", "/blocks.23/post_attention_layernorm/Mul_1_output_0", "/blocks.23/mlp/gate_proj/FakeLinear_output_0", "/blocks.23/mlp/act_fn/Mul_output_0", "/blocks.23/mlp/up_proj/FakeLinear_output_0", "/blocks.23/mlp/Mul_output_0", "/blocks.23/mlp/down_proj/FakeLinear_output_0", "/blocks.23/Add_1_output_0", "/blocks.24/Reshape_output_0", "/blocks.24/input_layernorm/Mul_1_output_0", "/blocks.24/self_attn/q_proj/FakeLinear_output_0", "/blocks.24/self_attn/Shape_output_0", "Shape3222", "Rank3224", "BinaryOp3226", "Unsqueeze3227", "BinaryOp3229", "Unsqueeze3230", "StridedSlice3233", "Squeeze3234", "BinaryOp3236", "/blocks.24/self_attn/Gather_output_0", "/blocks.24/self_attn/Unsqueeze_output_0", "Unsqueeze3244", "Unsqueeze3247", "StridedSlice3250", "Squeeze3251", "BinaryOp3252", "BinaryOp3253", "/blocks.24/self_attn/Gather_1_output_0", "/blocks.24/self_attn/Unsqueeze_1_output_0", "/blocks.24/self_attn/Concat_output_0", "/blocks.24/self_attn/Reshape_output_0", "/blocks.24/self_attn/Mul_output_0", "/blocks.24/self_attn/Shape_2_output_0", "Shape3260", "Rank3262", "BinaryOp3264", "Unsqueeze3265", "BinaryOp3267", "Unsqueeze3268", "StridedSlice3271", "Squeeze3272", "BinaryOp3273", "BinaryOp3274", "/blocks.24/self_attn/Gather_2_output_0", "/blocks.24/self_attn/Div_output_0", "/blocks.24/self_attn/Unsqueeze_7_output_0", "/blocks.24/self_attn/Slice_1_output_0", "/blocks.24/self_attn/Neg_output_0", "/blocks.24/self_attn/Unsqueeze_6_output_0", "/blocks.24/self_attn/Slice_output_0", "/blocks.24/self_attn/Concat_3_output_0", "/blocks.24/self_attn/Mul_1_output_0", "/blocks.24/self_attn/Add_output_0", "/blocks.24/self_attn/k_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_2_output_0", "/blocks.24/self_attn/Unsqueeze_3_output_0", "/blocks.24/self_attn/Concat_1_output_0", "/blocks.24/self_attn/Reshape_1_output_0", "/blocks.24/self_attn/Mul_2_output_0", "/blocks.24/self_attn/Shape_3_output_0", "Shape3293", "Rank3295", "BinaryOp3297", "Unsqueeze3298", "BinaryOp3300", "Unsqueeze3301", "StridedSlice3304", "Squeeze3305", "BinaryOp3306", "BinaryOp3307", "/blocks.24/self_attn/Gather_3_output_0", "/blocks.24/self_attn/Div_1_output_0", "/blocks.24/self_attn/Unsqueeze_9_output_0", "/blocks.24/self_attn/Slice_3_output_0", "/blocks.24/self_attn/Neg_1_output_0", "/blocks.24/self_attn/Unsqueeze_8_output_0", "/blocks.24/self_attn/Slice_2_output_0", "/blocks.24/self_attn/Concat_4_output_0", "/blocks.24/self_attn/Mul_3_output_0", "/blocks.24/self_attn/Add_1_output_0", "/blocks.24/self_attn/v_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_4_output_0", "/blocks.24/self_attn/Unsqueeze_5_output_0", "/blocks.24/self_attn/Concat_2_output_0", "/blocks.24/self_attn/Reshape_2_output_0", "/blocks.24/self_attn/fused_attn/FusedAttention_output_0", "/blocks.24/self_attn/o_proj/FakeLinear_output_0", "/blocks.24/Add_output_0", "/blocks.24/post_attention_layernorm/Mul_1_output_0", "/blocks.24/mlp/gate_proj/FakeLinear_output_0", "/blocks.24/mlp/act_fn/Mul_output_0", "/blocks.24/mlp/up_proj/FakeLinear_output_0", "/blocks.24/mlp/Mul_output_0", "/blocks.24/mlp/down_proj/FakeLinear_output_0", "/blocks.24/Add_1_output_0", "/blocks.25/Reshape_output_0", "/blocks.25/input_layernorm/Mul_1_output_0", "/blocks.25/self_attn/q_proj/FakeLinear_output_0", "/blocks.25/self_attn/Shape_output_0", "Shape3353", "Rank3355", "BinaryOp3357", "Unsqueeze3358", "BinaryOp3360", "Unsqueeze3361", "StridedSlice3364", "Squeeze3365", "BinaryOp3367", "/blocks.25/self_attn/Gather_output_0", "/blocks.25/self_attn/Unsqueeze_output_0", "Unsqueeze3375", "Unsqueeze3378", "StridedSlice3381", "Squeeze3382", "BinaryOp3383", "BinaryOp3384", "/blocks.25/self_attn/Gather_1_output_0", "/blocks.25/self_attn/Unsqueeze_1_output_0", "/blocks.25/self_attn/Concat_output_0", "/blocks.25/self_attn/Reshape_output_0", "/blocks.25/self_attn/Mul_output_0", "/blocks.25/self_attn/Shape_2_output_0", "Shape3391", "Rank3393", "BinaryOp3395", "Unsqueeze3396", "BinaryOp3398", "Unsqueeze3399", "StridedSlice3402", "Squeeze3403", "BinaryOp3404", "BinaryOp3405", "/blocks.25/self_attn/Gather_2_output_0", "/blocks.25/self_attn/Div_output_0", "/blocks.25/self_attn/Unsqueeze_7_output_0", "/blocks.25/self_attn/Slice_1_output_0", "/blocks.25/self_attn/Neg_output_0", "/blocks.25/self_attn/Unsqueeze_6_output_0", "/blocks.25/self_attn/Slice_output_0", "/blocks.25/self_attn/Concat_3_output_0", "/blocks.25/self_attn/Mul_1_output_0", "/blocks.25/self_attn/Add_output_0", "/blocks.25/self_attn/k_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_2_output_0", "/blocks.25/self_attn/Unsqueeze_3_output_0", "/blocks.25/self_attn/Concat_1_output_0", "/blocks.25/self_attn/Reshape_1_output_0", "/blocks.25/self_attn/Mul_2_output_0", "/blocks.25/self_attn/Shape_3_output_0", "Shape3424", "Rank3426", "BinaryOp3428", "Unsqueeze3429", "BinaryOp3431", "Unsqueeze3432", "StridedSlice3435", "Squeeze3436", "BinaryOp3437", "BinaryOp3438", "/blocks.25/self_attn/Gather_3_output_0", "/blocks.25/self_attn/Div_1_output_0", "/blocks.25/self_attn/Unsqueeze_9_output_0", "/blocks.25/self_attn/Slice_3_output_0", "/blocks.25/self_attn/Neg_1_output_0", "/blocks.25/self_attn/Unsqueeze_8_output_0", "/blocks.25/self_attn/Slice_2_output_0", "/blocks.25/self_attn/Concat_4_output_0", "/blocks.25/self_attn/Mul_3_output_0", "/blocks.25/self_attn/Add_1_output_0", "/blocks.25/self_attn/v_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_4_output_0", "/blocks.25/self_attn/Unsqueeze_5_output_0", "/blocks.25/self_attn/Concat_2_output_0", "/blocks.25/self_attn/Reshape_2_output_0", "/blocks.25/self_attn/fused_attn/FusedAttention_output_0", "/blocks.25/self_attn/o_proj/FakeLinear_output_0", "/blocks.25/Add_output_0", "/blocks.25/post_attention_layernorm/Mul_1_output_0", "/blocks.25/mlp/gate_proj/FakeLinear_output_0", "/blocks.25/mlp/act_fn/Mul_output_0", "/blocks.25/mlp/up_proj/FakeLinear_output_0", "/blocks.25/mlp/Mul_output_0", "/blocks.25/mlp/down_proj/FakeLinear_output_0", "/blocks.25/Add_1_output_0", "/blocks.26/Reshape_output_0", "/blocks.26/input_layernorm/Mul_1_output_0", "/blocks.26/self_attn/q_proj/FakeLinear_output_0", "/blocks.26/self_attn/Shape_output_0", "Shape3484", "Rank3486", "BinaryOp3488", "Unsqueeze3489", "BinaryOp3491", "Unsqueeze3492", "StridedSlice3495", "Squeeze3496", "BinaryOp3498", "/blocks.26/self_attn/Gather_output_0", "/blocks.26/self_attn/Unsqueeze_output_0", "Unsqueeze3506", "Unsqueeze3509", "StridedSlice3512", "Squeeze3513", "BinaryOp3514", "BinaryOp3515", "/blocks.26/self_attn/Gather_1_output_0", "/blocks.26/self_attn/Unsqueeze_1_output_0", "/blocks.26/self_attn/Concat_output_0", "/blocks.26/self_attn/Reshape_output_0", "/blocks.26/self_attn/Mul_output_0", "/blocks.26/self_attn/Shape_2_output_0", "Shape3522", "Rank3524", "BinaryOp3526", "Unsqueeze3527", "BinaryOp3529", "Unsqueeze3530", "StridedSlice3533", "Squeeze3534", "BinaryOp3535", "BinaryOp3536", "/blocks.26/self_attn/Gather_2_output_0", "/blocks.26/self_attn/Div_output_0", "/blocks.26/self_attn/Unsqueeze_7_output_0", "/blocks.26/self_attn/Slice_1_output_0", "/blocks.26/self_attn/Neg_output_0", "/blocks.26/self_attn/Unsqueeze_6_output_0", "/blocks.26/self_attn/Slice_output_0", "/blocks.26/self_attn/Concat_3_output_0", "/blocks.26/self_attn/Mul_1_output_0", "/blocks.26/self_attn/Add_output_0", "/blocks.26/self_attn/k_proj/FakeLinear_output_0", "/blocks.26/self_attn/Unsqueeze_2_output_0", "/blocks.26/self_attn/Unsqueeze_3_output_0", "/blocks.26/self_attn/Concat_1_output_0", "/blocks.26/self_attn/Reshape_1_output_0", "/blocks.26/self_attn/Mul_2_output_0", "/blocks.26/self_attn/Shape_3_output_0", "Shape3555", "Rank3557", "BinaryOp3559", "Unsqueeze3560", "BinaryOp3562", "Unsqueeze3563", "StridedSlice3566", "Squeeze3567", "BinaryOp3568", "BinaryOp3569", "/blocks.26/self_attn/Gather_3_output_0", "/blocks.26/self_attn/Div_1_output_0", "/blocks.26/self_attn/Unsqueeze_9_output_0", "/blocks.26/self_attn/Slice_3_output_0", "/blocks.26/self_attn/Neg_1_output_0", "/blocks.26/self_attn/Unsqueeze_8_output_0", "/blocks.26/self_attn/Slice_2_output_0", "/blocks.26/self_attn/Concat_4_output_0", "/blocks.26/self_attn/Mul_3_output_0", "/blocks.26/self_attn/Add_1_output_0", "/blocks.26/self_attn/v_proj/FakeLinear_output_0", "/blocks.26/self_attn/Unsqueeze_4_output_0", "/blocks.26/self_attn/Unsqueeze_5_output_0", "/blocks.26/self_attn/Concat_2_output_0", "/blocks.26/self_attn/Reshape_2_output_0", "/blocks.26/self_attn/fused_attn/FusedAttention_output_0", "/blocks.26/self_attn/o_proj/FakeLinear_output_0", "/blocks.26/Add_output_0", "/blocks.26/post_attention_layernorm/Mul_1_output_0", "/blocks.26/mlp/gate_proj/FakeLinear_output_0", "/blocks.26/mlp/act_fn/Mul_output_0", "/blocks.26/mlp/up_proj/FakeLinear_output_0", "/blocks.26/mlp/Mul_output_0", "/blocks.26/mlp/down_proj/FakeLinear_output_0", "/blocks.26/Add_1_output_0", "/blocks.27/Reshape_output_0", "/blocks.27/input_layernorm/Mul_1_output_0", "/blocks.27/self_attn/q_proj/FakeLinear_output_0", "/blocks.27/self_attn/Shape_output_0", "Shape3615", "Rank3617", "BinaryOp3619", "Unsqueeze3620", "BinaryOp3622", "Unsqueeze3623", "StridedSlice3626", "Squeeze3627", "BinaryOp3629", "/blocks.27/self_attn/Gather_output_0", "/blocks.27/self_attn/Unsqueeze_output_0", "Unsqueeze3637", "Unsqueeze3640", "StridedSlice3643", "Squeeze3644", "BinaryOp3645", "BinaryOp3646", "/blocks.27/self_attn/Gather_1_output_0", "/blocks.27/self_attn/Unsqueeze_1_output_0", "/blocks.27/self_attn/Concat_output_0", "/blocks.27/self_attn/Reshape_output_0", "/blocks.27/self_attn/Mul_output_0", "/blocks.27/self_attn/Shape_2_output_0", "Shape3653", "Rank3655", "BinaryOp3657", "Unsqueeze3658", "BinaryOp3660", "Unsqueeze3661", "StridedSlice3664", "Squeeze3665", "BinaryOp3666", "BinaryOp3667", "/blocks.27/self_attn/Gather_2_output_0", "/blocks.27/self_attn/Div_output_0", "/blocks.27/self_attn/Unsqueeze_7_output_0", "/blocks.27/self_attn/Slice_1_output_0", "/blocks.27/self_attn/Neg_output_0", "/blocks.27/self_attn/Unsqueeze_6_output_0", "/blocks.27/self_attn/Slice_output_0", "/blocks.27/self_attn/Concat_3_output_0", "/blocks.27/self_attn/Mul_1_output_0", "/blocks.27/self_attn/Add_output_0", "/blocks.27/self_attn/k_proj/FakeLinear_output_0", "/blocks.27/self_attn/Unsqueeze_2_output_0", "/blocks.27/self_attn/Unsqueeze_3_output_0", "/blocks.27/self_attn/Concat_1_output_0", "/blocks.27/self_attn/Reshape_1_output_0", "/blocks.27/self_attn/Mul_2_output_0", "/blocks.27/self_attn/Shape_3_output_0", "Shape3686", "Rank3688", "BinaryOp3690", "Unsqueeze3691", "BinaryOp3693", "Unsqueeze3694", "StridedSlice3697", "Squeeze3698", "BinaryOp3699", "BinaryOp3700", "/blocks.27/self_attn/Gather_3_output_0", "/blocks.27/self_attn/Div_1_output_0", "/blocks.27/self_attn/Unsqueeze_9_output_0", "/blocks.27/self_attn/Slice_3_output_0", "/blocks.27/self_attn/Neg_1_output_0", "/blocks.27/self_attn/Unsqueeze_8_output_0", "/blocks.27/self_attn/Slice_2_output_0", "/blocks.27/self_attn/Concat_4_output_0", "/blocks.27/self_attn/Mul_3_output_0", "/blocks.27/self_attn/Add_1_output_0", "/blocks.27/self_attn/v_proj/FakeLinear_output_0", "/blocks.27/self_attn/Unsqueeze_4_output_0", "/blocks.27/self_attn/Unsqueeze_5_output_0", "/blocks.27/self_attn/Concat_2_output_0", "/blocks.27/self_attn/Reshape_2_output_0", "/blocks.27/self_attn/fused_attn/FusedAttention_output_0", "/blocks.27/self_attn/o_proj/FakeLinear_output_0", "/blocks.27/Add_output_0", "/blocks.27/post_attention_layernorm/Mul_1_output_0", "/blocks.27/mlp/gate_proj/FakeLinear_output_0", "/blocks.27/mlp/act_fn/Mul_output_0", "/blocks.27/mlp/up_proj/FakeLinear_output_0", "/blocks.27/mlp/Mul_output_0", "/blocks.27/mlp/down_proj/FakeLinear_output_0", "/blocks.27/Add_1_output_0", "/blocks.28/Reshape_output_0", "/blocks.28/input_layernorm/Mul_1_output_0", "/blocks.28/self_attn/q_proj/FakeLinear_output_0", "/blocks.28/self_attn/Shape_output_0", "Shape3746", "Rank3748", "BinaryOp3750", "Unsqueeze3751", "BinaryOp3753", "Unsqueeze3754", "StridedSlice3757", "Squeeze3758", "BinaryOp3760", "/blocks.28/self_attn/Gather_output_0", "/blocks.28/self_attn/Unsqueeze_output_0", "Unsqueeze3768", "Unsqueeze3771", "StridedSlice3774", "Squeeze3775", "BinaryOp3776", "BinaryOp3777", "/blocks.28/self_attn/Gather_1_output_0", "/blocks.28/self_attn/Unsqueeze_1_output_0", "/blocks.28/self_attn/Concat_output_0", "/blocks.28/self_attn/Reshape_output_0", "/blocks.28/self_attn/Mul_output_0", "/blocks.28/self_attn/Shape_2_output_0", "Shape3784", "Rank3786", "BinaryOp3788", "Unsqueeze3789", "BinaryOp3791", "Unsqueeze3792", "StridedSlice3795", "Squeeze3796", "BinaryOp3797", "BinaryOp3798", "/blocks.28/self_attn/Gather_2_output_0", "/blocks.28/self_attn/Div_output_0", "/blocks.28/self_attn/Unsqueeze_7_output_0", "/blocks.28/self_attn/Slice_1_output_0", "/blocks.28/self_attn/Neg_output_0", "/blocks.28/self_attn/Unsqueeze_6_output_0", "/blocks.28/self_attn/Slice_output_0", "/blocks.28/self_attn/Concat_3_output_0", "/blocks.28/self_attn/Mul_1_output_0", "/blocks.28/self_attn/Add_output_0", "/blocks.28/self_attn/k_proj/FakeLinear_output_0", "/blocks.28/self_attn/Unsqueeze_2_output_0", "/blocks.28/self_attn/Unsqueeze_3_output_0", "/blocks.28/self_attn/Concat_1_output_0", "/blocks.28/self_attn/Reshape_1_output_0", "/blocks.28/self_attn/Mul_2_output_0", "/blocks.28/self_attn/Shape_3_output_0", "Shape3817", "Rank3819", "BinaryOp3821", "Unsqueeze3822", "BinaryOp3824", "Unsqueeze3825", "StridedSlice3828", "Squeeze3829", "BinaryOp3830", "BinaryOp3831", "/blocks.28/self_attn/Gather_3_output_0", "/blocks.28/self_attn/Div_1_output_0", "/blocks.28/self_attn/Unsqueeze_9_output_0", "/blocks.28/self_attn/Slice_3_output_0", "/blocks.28/self_attn/Neg_1_output_0", "/blocks.28/self_attn/Unsqueeze_8_output_0", "/blocks.28/self_attn/Slice_2_output_0", "/blocks.28/self_attn/Concat_4_output_0", "/blocks.28/self_attn/Mul_3_output_0", "/blocks.28/self_attn/Add_1_output_0", "/blocks.28/self_attn/v_proj/FakeLinear_output_0", "/blocks.28/self_attn/Unsqueeze_4_output_0", "/blocks.28/self_attn/Unsqueeze_5_output_0", "/blocks.28/self_attn/Concat_2_output_0", "/blocks.28/self_attn/Reshape_2_output_0", "/blocks.28/self_attn/fused_attn/FusedAttention_output_0", "/blocks.28/self_attn/o_proj/FakeLinear_output_0", "/blocks.28/Add_output_0", "/blocks.28/post_attention_layernorm/Mul_1_output_0", "/blocks.28/mlp/gate_proj/FakeLinear_output_0", "/blocks.28/mlp/act_fn/Mul_output_0", "/blocks.28/mlp/up_proj/FakeLinear_output_0", "/blocks.28/mlp/Mul_output_0", "/blocks.28/mlp/down_proj/FakeLinear_output_0", "/blocks.28/Add_1_output_0", "/blocks.29/Reshape_output_0", "/blocks.29/input_layernorm/Mul_1_output_0", "/blocks.29/self_attn/q_proj/FakeLinear_output_0", "/blocks.29/self_attn/Shape_output_0", "Shape3877", "Rank3879", "BinaryOp3881", "Unsqueeze3882", "BinaryOp3884", "Unsqueeze3885", "StridedSlice3888", "Squeeze3889", "BinaryOp3891", "/blocks.29/self_attn/Gather_output_0", "/blocks.29/self_attn/Unsqueeze_output_0", "Unsqueeze3899", "Unsqueeze3902", "StridedSlice3905", "Squeeze3906", "BinaryOp3907", "BinaryOp3908", "/blocks.29/self_attn/Gather_1_output_0", "/blocks.29/self_attn/Unsqueeze_1_output_0", "/blocks.29/self_attn/Concat_output_0", "/blocks.29/self_attn/Reshape_output_0", "/blocks.29/self_attn/Mul_output_0", "/blocks.29/self_attn/Shape_2_output_0", "Shape3915", "Rank3917", "BinaryOp3919", "Unsqueeze3920", "BinaryOp3922", "Unsqueeze3923", "StridedSlice3926", "Squeeze3927", "BinaryOp3928", "BinaryOp3929", "/blocks.29/self_attn/Gather_2_output_0", "/blocks.29/self_attn/Div_output_0", "/blocks.29/self_attn/Unsqueeze_7_output_0", "/blocks.29/self_attn/Slice_1_output_0", "/blocks.29/self_attn/Neg_output_0", "/blocks.29/self_attn/Unsqueeze_6_output_0", "/blocks.29/self_attn/Slice_output_0", "/blocks.29/self_attn/Concat_3_output_0", "/blocks.29/self_attn/Mul_1_output_0", "/blocks.29/self_attn/Add_output_0", "/blocks.29/self_attn/k_proj/FakeLinear_output_0", "/blocks.29/self_attn/Unsqueeze_2_output_0", "/blocks.29/self_attn/Unsqueeze_3_output_0", "/blocks.29/self_attn/Concat_1_output_0", "/blocks.29/self_attn/Reshape_1_output_0", "/blocks.29/self_attn/Mul_2_output_0", "/blocks.29/self_attn/Shape_3_output_0", "Shape3948", "Rank3950", "BinaryOp3952", "Unsqueeze3953", "BinaryOp3955", "Unsqueeze3956", "StridedSlice3959", "Squeeze3960", "BinaryOp3961", "BinaryOp3962", "/blocks.29/self_attn/Gather_3_output_0", "/blocks.29/self_attn/Div_1_output_0", "/blocks.29/self_attn/Unsqueeze_9_output_0", "/blocks.29/self_attn/Slice_3_output_0", "/blocks.29/self_attn/Neg_1_output_0", "/blocks.29/self_attn/Unsqueeze_8_output_0", "/blocks.29/self_attn/Slice_2_output_0", "/blocks.29/self_attn/Concat_4_output_0", "/blocks.29/self_attn/Mul_3_output_0", "/blocks.29/self_attn/Add_1_output_0", "/blocks.29/self_attn/v_proj/FakeLinear_output_0", "/blocks.29/self_attn/Unsqueeze_4_output_0", "/blocks.29/self_attn/Unsqueeze_5_output_0", "/blocks.29/self_attn/Concat_2_output_0", "/blocks.29/self_attn/Reshape_2_output_0", "/blocks.29/self_attn/fused_attn/FusedAttention_output_0", "/blocks.29/self_attn/o_proj/FakeLinear_output_0", "/blocks.29/Add_output_0", "/blocks.29/post_attention_layernorm/Mul_1_output_0", "/blocks.29/mlp/gate_proj/FakeLinear_output_0", "/blocks.29/mlp/act_fn/Mul_output_0", "/blocks.29/mlp/up_proj/FakeLinear_output_0", "/blocks.29/mlp/Mul_output_0", "/blocks.29/mlp/down_proj/FakeLinear_output_0", "/blocks.29/Add_1_output_0", "/blocks.30/Reshape_output_0", "/blocks.30/input_layernorm/Mul_1_output_0", "/blocks.30/self_attn/q_proj/FakeLinear_output_0", "/blocks.30/self_attn/Shape_output_0", "Shape4008", "Rank4010", "BinaryOp4012", "Unsqueeze4013", "BinaryOp4015", "Unsqueeze4016", "StridedSlice4019", "Squeeze4020", "BinaryOp4022", "/blocks.30/self_attn/Gather_output_0", "/blocks.30/self_attn/Unsqueeze_output_0", "Unsqueeze4030", "Unsqueeze4033", "StridedSlice4036", "Squeeze4037", "BinaryOp4038", "BinaryOp4039", "/blocks.30/self_attn/Gather_1_output_0", "/blocks.30/self_attn/Unsqueeze_1_output_0", "/blocks.30/self_attn/Concat_output_0", "/blocks.30/self_attn/Reshape_output_0", "/blocks.30/self_attn/Mul_output_0", "/blocks.30/self_attn/Shape_2_output_0", "Shape4046", "Rank4048", "BinaryOp4050", "Unsqueeze4051", "BinaryOp4053", "Unsqueeze4054", "StridedSlice4057", "Squeeze4058", "BinaryOp4059", "BinaryOp4060", "/blocks.30/self_attn/Gather_2_output_0", "/blocks.30/self_attn/Div_output_0", "/blocks.30/self_attn/Unsqueeze_7_output_0", "/blocks.30/self_attn/Slice_1_output_0", "/blocks.30/self_attn/Neg_output_0", "/blocks.30/self_attn/Unsqueeze_6_output_0", "/blocks.30/self_attn/Slice_output_0", "/blocks.30/self_attn/Concat_3_output_0", "/blocks.30/self_attn/Mul_1_output_0", "/blocks.30/self_attn/Add_output_0", "/blocks.30/self_attn/k_proj/FakeLinear_output_0", "/blocks.30/self_attn/Unsqueeze_2_output_0", "/blocks.30/self_attn/Unsqueeze_3_output_0", "/blocks.30/self_attn/Concat_1_output_0", "/blocks.30/self_attn/Reshape_1_output_0", "/blocks.30/self_attn/Mul_2_output_0", "/blocks.30/self_attn/Shape_3_output_0", "Shape4079", "Rank4081", "BinaryOp4083", "Unsqueeze4084", "BinaryOp4086", "Unsqueeze4087", "StridedSlice4090", "Squeeze4091", "BinaryOp4092", "BinaryOp4093", "/blocks.30/self_attn/Gather_3_output_0", "/blocks.30/self_attn/Div_1_output_0", "/blocks.30/self_attn/Unsqueeze_9_output_0", "/blocks.30/self_attn/Slice_3_output_0", "/blocks.30/self_attn/Neg_1_output_0", "/blocks.30/self_attn/Unsqueeze_8_output_0", "/blocks.30/self_attn/Slice_2_output_0", "/blocks.30/self_attn/Concat_4_output_0", "/blocks.30/self_attn/Mul_3_output_0", "/blocks.30/self_attn/Add_1_output_0", "/blocks.30/self_attn/v_proj/FakeLinear_output_0", "/blocks.30/self_attn/Unsqueeze_4_output_0", "/blocks.30/self_attn/Unsqueeze_5_output_0", "/blocks.30/self_attn/Concat_2_output_0", "/blocks.30/self_attn/Reshape_2_output_0", "/blocks.30/self_attn/fused_attn/FusedAttention_output_0", "/blocks.30/self_attn/o_proj/FakeLinear_output_0", "/blocks.30/Add_output_0", "/blocks.30/post_attention_layernorm/Mul_1_output_0", "/blocks.30/mlp/gate_proj/FakeLinear_output_0", "/blocks.30/mlp/act_fn/Mul_output_0", "/blocks.30/mlp/up_proj/FakeLinear_output_0", "/blocks.30/mlp/Mul_output_0", "/blocks.30/mlp/down_proj/FakeLinear_output_0", "/blocks.30/Add_1_output_0", "/blocks.31/Reshape_output_0", "/blocks.31/input_layernorm/Mul_1_output_0", "/blocks.31/self_attn/q_proj/FakeLinear_output_0", "/blocks.31/self_attn/Shape_output_0", "Shape4139", "Rank4141", "BinaryOp4143", "Unsqueeze4144", "BinaryOp4146", "Unsqueeze4147", "StridedSlice4150", "Squeeze4151", "BinaryOp4153", "/blocks.31/self_attn/Gather_output_0", "/blocks.31/self_attn/Unsqueeze_output_0", "Unsqueeze4161", "Unsqueeze4164", "StridedSlice4167", "Squeeze4168", "BinaryOp4169", "BinaryOp4170", "/blocks.31/self_attn/Gather_1_output_0", "/blocks.31/self_attn/Unsqueeze_1_output_0", "/blocks.31/self_attn/Concat_output_0", "/blocks.31/self_attn/Reshape_output_0", "/blocks.31/self_attn/Mul_output_0", "/blocks.31/self_attn/Shape_2_output_0", "Shape4177", "Rank4179", "BinaryOp4181", "Unsqueeze4182", "BinaryOp4184", "Unsqueeze4185", "StridedSlice4188", "Squeeze4189", "BinaryOp4190", "BinaryOp4191", "/blocks.31/self_attn/Gather_2_output_0", "/blocks.31/self_attn/Div_output_0", "/blocks.31/self_attn/Unsqueeze_7_output_0", "/blocks.31/self_attn/Slice_1_output_0", "/blocks.31/self_attn/Neg_output_0", "/blocks.31/self_attn/Unsqueeze_6_output_0", "/blocks.31/self_attn/Slice_output_0", "/blocks.31/self_attn/Concat_3_output_0", "/blocks.31/self_attn/Mul_1_output_0", "/blocks.31/self_attn/Add_output_0", "/blocks.31/self_attn/k_proj/FakeLinear_output_0", "/blocks.31/self_attn/Unsqueeze_2_output_0", "/blocks.31/self_attn/Unsqueeze_3_output_0", "/blocks.31/self_attn/Concat_1_output_0", "/blocks.31/self_attn/Reshape_1_output_0", "/blocks.31/self_attn/Mul_2_output_0", "/blocks.31/self_attn/Shape_3_output_0", "Shape4210", "Rank4212", "BinaryOp4214", "Unsqueeze4215", "BinaryOp4217", "Unsqueeze4218", "StridedSlice4221", "Squeeze4222", "BinaryOp4223", "BinaryOp4224", "/blocks.31/self_attn/Gather_3_output_0", "/blocks.31/self_attn/Div_1_output_0", "/blocks.31/self_attn/Unsqueeze_9_output_0", "/blocks.31/self_attn/Slice_3_output_0", "/blocks.31/self_attn/Neg_1_output_0", "/blocks.31/self_attn/Unsqueeze_8_output_0", "/blocks.31/self_attn/Slice_2_output_0", "/blocks.31/self_attn/Concat_4_output_0", "/blocks.31/self_attn/Mul_3_output_0", "/blocks.31/self_attn/Add_1_output_0", "/blocks.31/self_attn/v_proj/FakeLinear_output_0", "/blocks.31/self_attn/Unsqueeze_4_output_0", "/blocks.31/self_attn/Unsqueeze_5_output_0", "/blocks.31/self_attn/Concat_2_output_0", "/blocks.31/self_attn/Reshape_2_output_0", "/blocks.31/self_attn/fused_attn/FusedAttention_output_0", "/blocks.31/self_attn/o_proj/FakeLinear_output_0", "/blocks.31/Add_output_0", "/blocks.31/post_attention_layernorm/Mul_1_output_0", "/blocks.31/mlp/gate_proj/FakeLinear_output_0", "/blocks.31/mlp/act_fn/Mul_output_0", "/blocks.31/mlp/up_proj/FakeLinear_output_0", "/blocks.31/mlp/Mul_output_0", "/blocks.31/mlp/down_proj/FakeLinear_output_0", "/blocks.31/Add_1_output_0", "/Slice_output_0", "hidden_states", "logits", "/layers.0/self_attn/q_proj/Linear/pre_reshape", "/layers.0/self_attn/q_proj/Linear/pre_convert", "/layers.0/self_attn/q_proj/Linear", "/layers.0/self_attn/q_proj/Linear/post_convert", "/layers.0/self_attn/k_proj/Linear/pre_reshape", "/layers.0/self_attn/k_proj/Linear/pre_convert", "/layers.0/self_attn/k_proj/Linear", "/layers.0/self_attn/k_proj/Linear/post_convert", "/layers.0/self_attn/v_proj/Linear/pre_reshape", "/layers.0/self_attn/v_proj/Linear/pre_convert", "/layers.0/self_attn/v_proj/Linear", "/layers.0/self_attn/v_proj/Linear/post_convert", "/layers.0/self_attn/o_proj/Linear/pre_reshape", "/layers.0/self_attn/o_proj/Linear/pre_convert", "/layers.0/self_attn/o_proj/Linear", "/layers.0/self_attn/o_proj/Linear/post_convert", "/layers.0/mlp/gate_proj/Linear/pre_reshape", "/layers.0/mlp/gate_proj/Linear/pre_convert", "/layers.0/mlp/gate_proj/Linear", "/layers.0/mlp/gate_proj/Linear/post_convert", "/layers.0/mlp/up_proj/Linear/pre_reshape", "/layers.0/mlp/up_proj/Linear/pre_convert", "/layers.0/mlp/up_proj/Linear", "/layers.0/mlp/up_proj/Linear/post_convert", "/layers.0/mlp/down_proj/Linear/pre_reshape", "/layers.0/mlp/down_proj/Linear/pre_convert", "/layers.0/mlp/down_proj/Linear", "/layers.0/mlp/down_proj/Linear/post_convert", "/layers.1/self_attn/q_proj/Linear/pre_reshape", "/layers.1/self_attn/q_proj/Linear/pre_convert", "/layers.1/self_attn/q_proj/Linear", "/layers.1/self_attn/q_proj/Linear/post_convert", "/layers.1/self_attn/k_proj/Linear/pre_reshape", "/layers.1/self_attn/k_proj/Linear/pre_convert", "/layers.1/self_attn/k_proj/Linear", "/layers.1/self_attn/k_proj/Linear/post_convert", "/layers.1/self_attn/v_proj/Linear/pre_reshape", "/layers.1/self_attn/v_proj/Linear/pre_convert", "/layers.1/self_attn/v_proj/Linear", "/layers.1/self_attn/v_proj/Linear/post_convert", "/layers.1/self_attn/o_proj/Linear/pre_reshape", "/layers.1/self_attn/o_proj/Linear/pre_convert", "/layers.1/self_attn/o_proj/Linear", "/layers.1/self_attn/o_proj/Linear/post_convert", "/layers.1/mlp/gate_proj/Linear/pre_reshape", "/layers.1/mlp/gate_proj/Linear/pre_convert", "/layers.1/mlp/gate_proj/Linear", "/layers.1/mlp/gate_proj/Linear/post_convert", "/layers.1/mlp/up_proj/Linear/pre_reshape", "/layers.1/mlp/up_proj/Linear/pre_convert", "/layers.1/mlp/up_proj/Linear", "/layers.1/mlp/up_proj/Linear/post_convert", "/layers.1/mlp/down_proj/Linear/pre_reshape", "/layers.1/mlp/down_proj/Linear/pre_convert", "/layers.1/mlp/down_proj/Linear", "/layers.1/mlp/down_proj/Linear/post_convert", "/layers.2/self_attn/q_proj/Linear/pre_reshape", "/layers.2/self_attn/q_proj/Linear/pre_convert", "/layers.2/self_attn/q_proj/Linear", "/layers.2/self_attn/q_proj/Linear/post_convert", "/layers.2/self_attn/k_proj/Linear/pre_reshape", "/layers.2/self_attn/k_proj/Linear/pre_convert", "/layers.2/self_attn/k_proj/Linear", "/layers.2/self_attn/k_proj/Linear/post_convert", "/layers.2/self_attn/v_proj/Linear/pre_reshape", "/layers.2/self_attn/v_proj/Linear/pre_convert", "/layers.2/self_attn/v_proj/Linear", "/layers.2/self_attn/v_proj/Linear/post_convert", "/layers.2/self_attn/o_proj/Linear/pre_reshape", "/layers.2/self_attn/o_proj/Linear/pre_convert", "/layers.2/self_attn/o_proj/Linear", "/layers.2/self_attn/o_proj/Linear/post_convert", "/layers.2/mlp/gate_proj/Linear/pre_reshape", "/layers.2/mlp/gate_proj/Linear/pre_convert", "/layers.2/mlp/gate_proj/Linear", "/layers.2/mlp/gate_proj/Linear/post_convert", "/layers.2/mlp/up_proj/Linear/pre_reshape", "/layers.2/mlp/up_proj/Linear/pre_convert", "/layers.2/mlp/up_proj/Linear", "/layers.2/mlp/up_proj/Linear/post_convert", "/layers.2/mlp/down_proj/Linear/pre_reshape", "/layers.2/mlp/down_proj/Linear/pre_convert", "/layers.2/mlp/down_proj/Linear", "/layers.2/mlp/down_proj/Linear/post_convert", "/layers.3/self_attn/q_proj/Linear/pre_reshape", "/layers.3/self_attn/q_proj/Linear/pre_convert", "/layers.3/self_attn/q_proj/Linear", "/layers.3/self_attn/q_proj/Linear/post_convert", "/layers.3/self_attn/k_proj/Linear/pre_reshape", "/layers.3/self_attn/k_proj/Linear/pre_convert", "/layers.3/self_attn/k_proj/Linear", "/layers.3/self_attn/k_proj/Linear/post_convert", "/layers.3/self_attn/v_proj/Linear/pre_reshape", "/layers.3/self_attn/v_proj/Linear/pre_convert", "/layers.3/self_attn/v_proj/Linear", "/layers.3/self_attn/v_proj/Linear/post_convert", "/layers.3/self_attn/o_proj/Linear/pre_reshape", "/layers.3/self_attn/o_proj/Linear/pre_convert", "/layers.3/self_attn/o_proj/Linear", "/layers.3/self_attn/o_proj/Linear/post_convert", "/layers.3/mlp/gate_proj/Linear/pre_reshape", "/layers.3/mlp/gate_proj/Linear/pre_convert", "/layers.3/mlp/gate_proj/Linear", "/layers.3/mlp/gate_proj/Linear/post_convert", "/layers.3/mlp/up_proj/Linear/pre_reshape", "/layers.3/mlp/up_proj/Linear/pre_convert", "/layers.3/mlp/up_proj/Linear", "/layers.3/mlp/up_proj/Linear/post_convert", "/layers.3/mlp/down_proj/Linear/pre_reshape", "/layers.3/mlp/down_proj/Linear/pre_convert", "/layers.3/mlp/down_proj/Linear", "/layers.3/mlp/down_proj/Linear/post_convert", "/layers.4/self_attn/q_proj/Linear/pre_reshape", "/layers.4/self_attn/q_proj/Linear/pre_convert", "/layers.4/self_attn/q_proj/Linear", "/layers.4/self_attn/q_proj/Linear/post_convert", "/layers.4/self_attn/k_proj/Linear/pre_reshape", "/layers.4/self_attn/k_proj/Linear/pre_convert", "/layers.4/self_attn/k_proj/Linear", "/layers.4/self_attn/k_proj/Linear/post_convert", "/layers.4/self_attn/v_proj/Linear/pre_reshape", "/layers.4/self_attn/v_proj/Linear/pre_convert", "/layers.4/self_attn/v_proj/Linear", "/layers.4/self_attn/v_proj/Linear/post_convert", "/layers.4/self_attn/o_proj/Linear/pre_reshape", "/layers.4/self_attn/o_proj/Linear/pre_convert", "/layers.4/self_attn/o_proj/Linear", "/layers.4/self_attn/o_proj/Linear/post_convert", "/layers.4/mlp/gate_proj/Linear/pre_reshape", "/layers.4/mlp/gate_proj/Linear/pre_convert", "/layers.4/mlp/gate_proj/Linear", "/layers.4/mlp/gate_proj/Linear/post_convert", "/layers.4/mlp/up_proj/Linear/pre_reshape", "/layers.4/mlp/up_proj/Linear/pre_convert", "/layers.4/mlp/up_proj/Linear", "/layers.4/mlp/up_proj/Linear/post_convert", "/layers.4/mlp/down_proj/Linear/pre_reshape", "/layers.4/mlp/down_proj/Linear/pre_convert", "/layers.4/mlp/down_proj/Linear", "/layers.4/mlp/down_proj/Linear/post_convert", "/layers.5/self_attn/q_proj/Linear/pre_reshape", "/layers.5/self_attn/q_proj/Linear/pre_convert", "/layers.5/self_attn/q_proj/Linear", "/layers.5/self_attn/q_proj/Linear/post_convert", "/layers.5/self_attn/k_proj/Linear/pre_reshape", "/layers.5/self_attn/k_proj/Linear/pre_convert", "/layers.5/self_attn/k_proj/Linear", "/layers.5/self_attn/k_proj/Linear/post_convert", "/layers.5/self_attn/v_proj/Linear/pre_reshape", "/layers.5/self_attn/v_proj/Linear/pre_convert", "/layers.5/self_attn/v_proj/Linear", "/layers.5/self_attn/v_proj/Linear/post_convert", "/layers.5/self_attn/o_proj/Linear/pre_reshape", "/layers.5/self_attn/o_proj/Linear/pre_convert", "/layers.5/self_attn/o_proj/Linear", "/layers.5/self_attn/o_proj/Linear/post_convert", "/layers.5/mlp/gate_proj/Linear/pre_reshape", "/layers.5/mlp/gate_proj/Linear/pre_convert", "/layers.5/mlp/gate_proj/Linear", "/layers.5/mlp/gate_proj/Linear/post_convert", "/layers.5/mlp/up_proj/Linear/pre_reshape", "/layers.5/mlp/up_proj/Linear/pre_convert", "/layers.5/mlp/up_proj/Linear", "/layers.5/mlp/up_proj/Linear/post_convert", "/layers.5/mlp/down_proj/Linear/pre_reshape", "/layers.5/mlp/down_proj/Linear/pre_convert", "/layers.5/mlp/down_proj/Linear", "/layers.5/mlp/down_proj/Linear/post_convert", "/layers.6/self_attn/q_proj/Linear/pre_reshape", "/layers.6/self_attn/q_proj/Linear/pre_convert", "/layers.6/self_attn/q_proj/Linear", "/layers.6/self_attn/q_proj/Linear/post_convert", "/layers.6/self_attn/k_proj/Linear/pre_reshape", "/layers.6/self_attn/k_proj/Linear/pre_convert", "/layers.6/self_attn/k_proj/Linear", "/layers.6/self_attn/k_proj/Linear/post_convert", "/layers.6/self_attn/v_proj/Linear/pre_reshape", "/layers.6/self_attn/v_proj/Linear/pre_convert", "/layers.6/self_attn/v_proj/Linear", "/layers.6/self_attn/v_proj/Linear/post_convert", "/layers.6/self_attn/o_proj/Linear/pre_reshape", "/layers.6/self_attn/o_proj/Linear/pre_convert", "/layers.6/self_attn/o_proj/Linear", "/layers.6/self_attn/o_proj/Linear/post_convert", "/layers.6/mlp/gate_proj/Linear/pre_reshape", "/layers.6/mlp/gate_proj/Linear/pre_convert", "/layers.6/mlp/gate_proj/Linear", "/layers.6/mlp/gate_proj/Linear/post_convert", "/layers.6/mlp/up_proj/Linear/pre_reshape", "/layers.6/mlp/up_proj/Linear/pre_convert", "/layers.6/mlp/up_proj/Linear", "/layers.6/mlp/up_proj/Linear/post_convert", "/layers.6/mlp/down_proj/Linear/pre_reshape", "/layers.6/mlp/down_proj/Linear/pre_convert", "/layers.6/mlp/down_proj/Linear", "/layers.6/mlp/down_proj/Linear/post_convert", "/layers.7/self_attn/q_proj/Linear/pre_reshape", "/layers.7/self_attn/q_proj/Linear/pre_convert", "/layers.7/self_attn/q_proj/Linear", "/layers.7/self_attn/q_proj/Linear/post_convert", "/layers.7/self_attn/k_proj/Linear/pre_reshape", "/layers.7/self_attn/k_proj/Linear/pre_convert", "/layers.7/self_attn/k_proj/Linear", "/layers.7/self_attn/k_proj/Linear/post_convert", "/layers.7/self_attn/v_proj/Linear/pre_reshape", "/layers.7/self_attn/v_proj/Linear/pre_convert", "/layers.7/self_attn/v_proj/Linear", "/layers.7/self_attn/v_proj/Linear/post_convert", "/layers.7/self_attn/o_proj/Linear/pre_reshape", "/layers.7/self_attn/o_proj/Linear/pre_convert", "/layers.7/self_attn/o_proj/Linear", "/layers.7/self_attn/o_proj/Linear/post_convert", "/layers.7/mlp/gate_proj/Linear/pre_reshape", "/layers.7/mlp/gate_proj/Linear/pre_convert", "/layers.7/mlp/gate_proj/Linear", "/layers.7/mlp/gate_proj/Linear/post_convert", "/layers.7/mlp/up_proj/Linear/pre_reshape", "/layers.7/mlp/up_proj/Linear/pre_convert", "/layers.7/mlp/up_proj/Linear", "/layers.7/mlp/up_proj/Linear/post_convert", "/layers.7/mlp/down_proj/Linear/pre_reshape", "/layers.7/mlp/down_proj/Linear/pre_convert", "/layers.7/mlp/down_proj/Linear", "/layers.7/mlp/down_proj/Linear/post_convert", "/layers.8/self_attn/q_proj/Linear/pre_reshape", "/layers.8/self_attn/q_proj/Linear/pre_convert", "/layers.8/self_attn/q_proj/Linear", "/layers.8/self_attn/q_proj/Linear/post_convert", "/layers.8/self_attn/k_proj/Linear/pre_reshape", "/layers.8/self_attn/k_proj/Linear/pre_convert", "/layers.8/self_attn/k_proj/Linear", "/layers.8/self_attn/k_proj/Linear/post_convert", "/layers.8/self_attn/v_proj/Linear/pre_reshape", "/layers.8/self_attn/v_proj/Linear/pre_convert", "/layers.8/self_attn/v_proj/Linear", "/layers.8/self_attn/v_proj/Linear/post_convert", "/layers.8/self_attn/o_proj/Linear/pre_reshape", "/layers.8/self_attn/o_proj/Linear/pre_convert", "/layers.8/self_attn/o_proj/Linear", "/layers.8/self_attn/o_proj/Linear/post_convert", "/layers.8/mlp/gate_proj/Linear/pre_reshape", "/layers.8/mlp/gate_proj/Linear/pre_convert", "/layers.8/mlp/gate_proj/Linear", "/layers.8/mlp/gate_proj/Linear/post_convert", "/layers.8/mlp/up_proj/Linear/pre_reshape", "/layers.8/mlp/up_proj/Linear/pre_convert", "/layers.8/mlp/up_proj/Linear", "/layers.8/mlp/up_proj/Linear/post_convert", "/layers.8/mlp/down_proj/Linear/pre_reshape", "/layers.8/mlp/down_proj/Linear/pre_convert", "/layers.8/mlp/down_proj/Linear", "/layers.8/mlp/down_proj/Linear/post_convert", "/layers.9/self_attn/q_proj/Linear/pre_reshape", "/layers.9/self_attn/q_proj/Linear/pre_convert", "/layers.9/self_attn/q_proj/Linear", "/layers.9/self_attn/q_proj/Linear/post_convert", "/layers.9/self_attn/k_proj/Linear/pre_reshape", "/layers.9/self_attn/k_proj/Linear/pre_convert", "/layers.9/self_attn/k_proj/Linear", "/layers.9/self_attn/k_proj/Linear/post_convert", "/layers.9/self_attn/v_proj/Linear/pre_reshape", "/layers.9/self_attn/v_proj/Linear/pre_convert", "/layers.9/self_attn/v_proj/Linear", "/layers.9/self_attn/v_proj/Linear/post_convert", "/layers.9/self_attn/o_proj/Linear/pre_reshape", "/layers.9/self_attn/o_proj/Linear/pre_convert", "/layers.9/self_attn/o_proj/Linear", "/layers.9/self_attn/o_proj/Linear/post_convert", "/layers.9/mlp/gate_proj/Linear/pre_reshape", "/layers.9/mlp/gate_proj/Linear/pre_convert", "/layers.9/mlp/gate_proj/Linear", "/layers.9/mlp/gate_proj/Linear/post_convert", "/layers.9/mlp/up_proj/Linear/pre_reshape", "/layers.9/mlp/up_proj/Linear/pre_convert", "/layers.9/mlp/up_proj/Linear", "/layers.9/mlp/up_proj/Linear/post_convert", "/layers.9/mlp/down_proj/Linear/pre_reshape", "/layers.9/mlp/down_proj/Linear/pre_convert", "/layers.9/mlp/down_proj/Linear", "/layers.9/mlp/down_proj/Linear/post_convert", "/layers.10/self_attn/q_proj/Linear/pre_reshape", "/layers.10/self_attn/q_proj/Linear/pre_convert", "/layers.10/self_attn/q_proj/Linear", "/layers.10/self_attn/q_proj/Linear/post_convert", "/layers.10/self_attn/k_proj/Linear/pre_reshape", "/layers.10/self_attn/k_proj/Linear/pre_convert", "/layers.10/self_attn/k_proj/Linear", "/layers.10/self_attn/k_proj/Linear/post_convert", "/layers.10/self_attn/v_proj/Linear/pre_reshape", "/layers.10/self_attn/v_proj/Linear/pre_convert", "/layers.10/self_attn/v_proj/Linear", "/layers.10/self_attn/v_proj/Linear/post_convert", "/layers.10/self_attn/o_proj/Linear/pre_reshape", "/layers.10/self_attn/o_proj/Linear/pre_convert", "/layers.10/self_attn/o_proj/Linear", "/layers.10/self_attn/o_proj/Linear/post_convert", "/layers.10/mlp/gate_proj/Linear/pre_reshape", "/layers.10/mlp/gate_proj/Linear/pre_convert", "/layers.10/mlp/gate_proj/Linear", "/layers.10/mlp/gate_proj/Linear/post_convert", "/layers.10/mlp/up_proj/Linear/pre_reshape", "/layers.10/mlp/up_proj/Linear/pre_convert", "/layers.10/mlp/up_proj/Linear", "/layers.10/mlp/up_proj/Linear/post_convert", "/layers.10/mlp/down_proj/Linear/pre_reshape", "/layers.10/mlp/down_proj/Linear/pre_convert", "/layers.10/mlp/down_proj/Linear", "/layers.10/mlp/down_proj/Linear/post_convert", "/layers.11/self_attn/q_proj/Linear/pre_reshape", "/layers.11/self_attn/q_proj/Linear/pre_convert", "/layers.11/self_attn/q_proj/Linear", "/layers.11/self_attn/q_proj/Linear/post_convert", "/layers.11/self_attn/k_proj/Linear/pre_reshape", "/layers.11/self_attn/k_proj/Linear/pre_convert", "/layers.11/self_attn/k_proj/Linear", "/layers.11/self_attn/k_proj/Linear/post_convert", "/layers.11/self_attn/v_proj/Linear/pre_reshape", "/layers.11/self_attn/v_proj/Linear/pre_convert", "/layers.11/self_attn/v_proj/Linear", "/layers.11/self_attn/v_proj/Linear/post_convert", "/layers.11/self_attn/o_proj/Linear/pre_reshape", "/layers.11/self_attn/o_proj/Linear/pre_convert", "/layers.11/self_attn/o_proj/Linear", "/layers.11/self_attn/o_proj/Linear/post_convert", "/layers.11/mlp/gate_proj/Linear/pre_reshape", "/layers.11/mlp/gate_proj/Linear/pre_convert", "/layers.11/mlp/gate_proj/Linear", "/layers.11/mlp/gate_proj/Linear/post_convert", "/layers.11/mlp/up_proj/Linear/pre_reshape", "/layers.11/mlp/up_proj/Linear/pre_convert", "/layers.11/mlp/up_proj/Linear", "/layers.11/mlp/up_proj/Linear/post_convert", "/layers.11/mlp/down_proj/Linear/pre_reshape", "/layers.11/mlp/down_proj/Linear/pre_convert", "/layers.11/mlp/down_proj/Linear", "/layers.11/mlp/down_proj/Linear/post_convert", "/layers.12/self_attn/q_proj/Linear/pre_reshape", "/layers.12/self_attn/q_proj/Linear/pre_convert", "/layers.12/self_attn/q_proj/Linear", "/layers.12/self_attn/q_proj/Linear/post_convert", "/layers.12/self_attn/k_proj/Linear/pre_reshape", "/layers.12/self_attn/k_proj/Linear/pre_convert", "/layers.12/self_attn/k_proj/Linear", "/layers.12/self_attn/k_proj/Linear/post_convert", "/layers.12/self_attn/v_proj/Linear/pre_reshape", "/layers.12/self_attn/v_proj/Linear/pre_convert", "/layers.12/self_attn/v_proj/Linear", "/layers.12/self_attn/v_proj/Linear/post_convert", "/layers.12/self_attn/o_proj/Linear/pre_reshape", "/layers.12/self_attn/o_proj/Linear/pre_convert", "/layers.12/self_attn/o_proj/Linear", "/layers.12/self_attn/o_proj/Linear/post_convert", "/layers.12/mlp/gate_proj/Linear/pre_reshape", "/layers.12/mlp/gate_proj/Linear/pre_convert", "/layers.12/mlp/gate_proj/Linear", "/layers.12/mlp/gate_proj/Linear/post_convert", "/layers.12/mlp/up_proj/Linear/pre_reshape", "/layers.12/mlp/up_proj/Linear/pre_convert", "/layers.12/mlp/up_proj/Linear", "/layers.12/mlp/up_proj/Linear/post_convert", "/layers.12/mlp/down_proj/Linear/pre_reshape", "/layers.12/mlp/down_proj/Linear/pre_convert", "/layers.12/mlp/down_proj/Linear", "/layers.12/mlp/down_proj/Linear/post_convert", "/layers.13/self_attn/q_proj/Linear/pre_reshape", "/layers.13/self_attn/q_proj/Linear/pre_convert", "/layers.13/self_attn/q_proj/Linear", "/layers.13/self_attn/q_proj/Linear/post_convert", "/layers.13/self_attn/k_proj/Linear/pre_reshape", "/layers.13/self_attn/k_proj/Linear/pre_convert", "/layers.13/self_attn/k_proj/Linear", "/layers.13/self_attn/k_proj/Linear/post_convert", "/layers.13/self_attn/v_proj/Linear/pre_reshape", "/layers.13/self_attn/v_proj/Linear/pre_convert", "/layers.13/self_attn/v_proj/Linear", "/layers.13/self_attn/v_proj/Linear/post_convert", "/layers.13/self_attn/o_proj/Linear/pre_reshape", "/layers.13/self_attn/o_proj/Linear/pre_convert", "/layers.13/self_attn/o_proj/Linear", "/layers.13/self_attn/o_proj/Linear/post_convert", "/layers.13/mlp/gate_proj/Linear/pre_reshape", "/layers.13/mlp/gate_proj/Linear/pre_convert", "/layers.13/mlp/gate_proj/Linear", "/layers.13/mlp/gate_proj/Linear/post_convert", "/layers.13/mlp/up_proj/Linear/pre_reshape", "/layers.13/mlp/up_proj/Linear/pre_convert", "/layers.13/mlp/up_proj/Linear", "/layers.13/mlp/up_proj/Linear/post_convert", "/layers.13/mlp/down_proj/Linear/pre_reshape", "/layers.13/mlp/down_proj/Linear/pre_convert", "/layers.13/mlp/down_proj/Linear", "/layers.13/mlp/down_proj/Linear/post_convert", "/layers.14/self_attn/q_proj/Linear/pre_reshape", "/layers.14/self_attn/q_proj/Linear/pre_convert", "/layers.14/self_attn/q_proj/Linear", "/layers.14/self_attn/q_proj/Linear/post_convert", "/layers.14/self_attn/k_proj/Linear/pre_reshape", "/layers.14/self_attn/k_proj/Linear/pre_convert", "/layers.14/self_attn/k_proj/Linear", "/layers.14/self_attn/k_proj/Linear/post_convert", "/layers.14/self_attn/v_proj/Linear/pre_reshape", "/layers.14/self_attn/v_proj/Linear/pre_convert", "/layers.14/self_attn/v_proj/Linear", "/layers.14/self_attn/v_proj/Linear/post_convert", "/layers.14/self_attn/o_proj/Linear/pre_reshape", "/layers.14/self_attn/o_proj/Linear/pre_convert", "/layers.14/self_attn/o_proj/Linear", "/layers.14/self_attn/o_proj/Linear/post_convert", "/layers.14/mlp/gate_proj/Linear/pre_reshape", "/layers.14/mlp/gate_proj/Linear/pre_convert", "/layers.14/mlp/gate_proj/Linear", "/layers.14/mlp/gate_proj/Linear/post_convert", "/layers.14/mlp/up_proj/Linear/pre_reshape", "/layers.14/mlp/up_proj/Linear/pre_convert", "/layers.14/mlp/up_proj/Linear", "/layers.14/mlp/up_proj/Linear/post_convert", "/layers.14/mlp/down_proj/Linear/pre_reshape", "/layers.14/mlp/down_proj/Linear/pre_convert", "/layers.14/mlp/down_proj/Linear", "/layers.14/mlp/down_proj/Linear/post_convert", "/layers.15/self_attn/q_proj/Linear/pre_reshape", "/layers.15/self_attn/q_proj/Linear/pre_convert", "/layers.15/self_attn/q_proj/Linear", "/layers.15/self_attn/q_proj/Linear/post_convert", "/layers.15/self_attn/k_proj/Linear/pre_reshape", "/layers.15/self_attn/k_proj/Linear/pre_convert", "/layers.15/self_attn/k_proj/Linear", "/layers.15/self_attn/k_proj/Linear/post_convert", "/layers.15/self_attn/v_proj/Linear/pre_reshape", "/layers.15/self_attn/v_proj/Linear/pre_convert", "/layers.15/self_attn/v_proj/Linear", "/layers.15/self_attn/v_proj/Linear/post_convert", "/layers.15/self_attn/o_proj/Linear/pre_reshape", "/layers.15/self_attn/o_proj/Linear/pre_convert", "/layers.15/self_attn/o_proj/Linear", "/layers.15/self_attn/o_proj/Linear/post_convert", "/layers.15/mlp/gate_proj/Linear/pre_reshape", "/layers.15/mlp/gate_proj/Linear/pre_convert", "/layers.15/mlp/gate_proj/Linear", "/layers.15/mlp/gate_proj/Linear/post_convert", "/layers.15/mlp/up_proj/Linear/pre_reshape", "/layers.15/mlp/up_proj/Linear/pre_convert", "/layers.15/mlp/up_proj/Linear", "/layers.15/mlp/up_proj/Linear/post_convert", "/layers.15/mlp/down_proj/Linear/pre_reshape", "/layers.15/mlp/down_proj/Linear/pre_convert", "/layers.15/mlp/down_proj/Linear", "/layers.15/mlp/down_proj/Linear/post_convert", "/layers.16/self_attn/q_proj/Linear/pre_reshape", "/layers.16/self_attn/q_proj/Linear/pre_convert", "/layers.16/self_attn/q_proj/Linear", "/layers.16/self_attn/q_proj/Linear/post_convert", "/layers.16/self_attn/k_proj/Linear/pre_reshape", "/layers.16/self_attn/k_proj/Linear/pre_convert", "/layers.16/self_attn/k_proj/Linear", "/layers.16/self_attn/k_proj/Linear/post_convert", "/layers.16/self_attn/v_proj/Linear/pre_reshape", "/layers.16/self_attn/v_proj/Linear/pre_convert", "/layers.16/self_attn/v_proj/Linear", "/layers.16/self_attn/v_proj/Linear/post_convert", "/layers.16/self_attn/o_proj/Linear/pre_reshape", "/layers.16/self_attn/o_proj/Linear/pre_convert", "/layers.16/self_attn/o_proj/Linear", "/layers.16/self_attn/o_proj/Linear/post_convert", "/layers.16/mlp/gate_proj/Linear/pre_reshape", "/layers.16/mlp/gate_proj/Linear/pre_convert", "/layers.16/mlp/gate_proj/Linear", "/layers.16/mlp/gate_proj/Linear/post_convert", "/layers.16/mlp/up_proj/Linear/pre_reshape", "/layers.16/mlp/up_proj/Linear/pre_convert", "/layers.16/mlp/up_proj/Linear", "/layers.16/mlp/up_proj/Linear/post_convert", "/layers.16/mlp/down_proj/Linear/pre_reshape", "/layers.16/mlp/down_proj/Linear/pre_convert", "/layers.16/mlp/down_proj/Linear", "/layers.16/mlp/down_proj/Linear/post_convert", "/layers.17/self_attn/q_proj/Linear/pre_reshape", "/layers.17/self_attn/q_proj/Linear/pre_convert", "/layers.17/self_attn/q_proj/Linear", "/layers.17/self_attn/q_proj/Linear/post_convert", "/layers.17/self_attn/k_proj/Linear/pre_reshape", "/layers.17/self_attn/k_proj/Linear/pre_convert", "/layers.17/self_attn/k_proj/Linear", "/layers.17/self_attn/k_proj/Linear/post_convert", "/layers.17/self_attn/v_proj/Linear/pre_reshape", "/layers.17/self_attn/v_proj/Linear/pre_convert", "/layers.17/self_attn/v_proj/Linear", "/layers.17/self_attn/v_proj/Linear/post_convert", "/layers.17/self_attn/o_proj/Linear/pre_reshape", "/layers.17/self_attn/o_proj/Linear/pre_convert", "/layers.17/self_attn/o_proj/Linear", "/layers.17/self_attn/o_proj/Linear/post_convert", "/layers.17/mlp/gate_proj/Linear/pre_reshape", "/layers.17/mlp/gate_proj/Linear/pre_convert", "/layers.17/mlp/gate_proj/Linear", "/layers.17/mlp/gate_proj/Linear/post_convert", "/layers.17/mlp/up_proj/Linear/pre_reshape", "/layers.17/mlp/up_proj/Linear/pre_convert", "/layers.17/mlp/up_proj/Linear", "/layers.17/mlp/up_proj/Linear/post_convert", "/layers.17/mlp/down_proj/Linear/pre_reshape", "/layers.17/mlp/down_proj/Linear/pre_convert", "/layers.17/mlp/down_proj/Linear", "/layers.17/mlp/down_proj/Linear/post_convert", "/layers.18/self_attn/q_proj/Linear/pre_reshape", "/layers.18/self_attn/q_proj/Linear/pre_convert", "/layers.18/self_attn/q_proj/Linear", "/layers.18/self_attn/q_proj/Linear/post_convert", "/layers.18/self_attn/k_proj/Linear/pre_reshape", "/layers.18/self_attn/k_proj/Linear/pre_convert", "/layers.18/self_attn/k_proj/Linear", "/layers.18/self_attn/k_proj/Linear/post_convert", "/layers.18/self_attn/v_proj/Linear/pre_reshape", "/layers.18/self_attn/v_proj/Linear/pre_convert", "/layers.18/self_attn/v_proj/Linear", "/layers.18/self_attn/v_proj/Linear/post_convert", "/layers.18/self_attn/o_proj/Linear/pre_reshape", "/layers.18/self_attn/o_proj/Linear/pre_convert", "/layers.18/self_attn/o_proj/Linear", "/layers.18/self_attn/o_proj/Linear/post_convert", "/layers.18/mlp/gate_proj/Linear/pre_reshape", "/layers.18/mlp/gate_proj/Linear/pre_convert", "/layers.18/mlp/gate_proj/Linear", "/layers.18/mlp/gate_proj/Linear/post_convert", "/layers.18/mlp/up_proj/Linear/pre_reshape", "/layers.18/mlp/up_proj/Linear/pre_convert", "/layers.18/mlp/up_proj/Linear", "/layers.18/mlp/up_proj/Linear/post_convert", "/layers.18/mlp/down_proj/Linear/pre_reshape", "/layers.18/mlp/down_proj/Linear/pre_convert", "/layers.18/mlp/down_proj/Linear", "/layers.18/mlp/down_proj/Linear/post_convert", "/layers.19/self_attn/q_proj/Linear/pre_reshape", "/layers.19/self_attn/q_proj/Linear/pre_convert", "/layers.19/self_attn/q_proj/Linear", "/layers.19/self_attn/q_proj/Linear/post_convert", "/layers.19/self_attn/k_proj/Linear/pre_reshape", "/layers.19/self_attn/k_proj/Linear/pre_convert", "/layers.19/self_attn/k_proj/Linear", "/layers.19/self_attn/k_proj/Linear/post_convert", "/layers.19/self_attn/v_proj/Linear/pre_reshape", "/layers.19/self_attn/v_proj/Linear/pre_convert", "/layers.19/self_attn/v_proj/Linear", "/layers.19/self_attn/v_proj/Linear/post_convert", "/layers.19/self_attn/o_proj/Linear/pre_reshape", "/layers.19/self_attn/o_proj/Linear/pre_convert", "/layers.19/self_attn/o_proj/Linear", "/layers.19/self_attn/o_proj/Linear/post_convert", "/layers.19/mlp/gate_proj/Linear/pre_reshape", "/layers.19/mlp/gate_proj/Linear/pre_convert", "/layers.19/mlp/gate_proj/Linear", "/layers.19/mlp/gate_proj/Linear/post_convert", "/layers.19/mlp/up_proj/Linear/pre_reshape", "/layers.19/mlp/up_proj/Linear/pre_convert", "/layers.19/mlp/up_proj/Linear", "/layers.19/mlp/up_proj/Linear/post_convert", "/layers.19/mlp/down_proj/Linear/pre_reshape", "/layers.19/mlp/down_proj/Linear/pre_convert", "/layers.19/mlp/down_proj/Linear", "/layers.19/mlp/down_proj/Linear/post_convert", "/layers.20/self_attn/q_proj/Linear/pre_reshape", "/layers.20/self_attn/q_proj/Linear/pre_convert", "/layers.20/self_attn/q_proj/Linear", "/layers.20/self_attn/q_proj/Linear/post_convert", "/layers.20/self_attn/k_proj/Linear/pre_reshape", "/layers.20/self_attn/k_proj/Linear/pre_convert", "/layers.20/self_attn/k_proj/Linear", "/layers.20/self_attn/k_proj/Linear/post_convert", "/layers.20/self_attn/v_proj/Linear/pre_reshape", "/layers.20/self_attn/v_proj/Linear/pre_convert", "/layers.20/self_attn/v_proj/Linear", "/layers.20/self_attn/v_proj/Linear/post_convert", "/layers.20/self_attn/o_proj/Linear/pre_reshape", "/layers.20/self_attn/o_proj/Linear/pre_convert", "/layers.20/self_attn/o_proj/Linear", "/layers.20/self_attn/o_proj/Linear/post_convert", "/layers.20/mlp/gate_proj/Linear/pre_reshape", "/layers.20/mlp/gate_proj/Linear/pre_convert", "/layers.20/mlp/gate_proj/Linear", "/layers.20/mlp/gate_proj/Linear/post_convert", "/layers.20/mlp/up_proj/Linear/pre_reshape", "/layers.20/mlp/up_proj/Linear/pre_convert", "/layers.20/mlp/up_proj/Linear", "/layers.20/mlp/up_proj/Linear/post_convert", "/layers.20/mlp/down_proj/Linear/pre_reshape", "/layers.20/mlp/down_proj/Linear/pre_convert", "/layers.20/mlp/down_proj/Linear", "/layers.20/mlp/down_proj/Linear/post_convert", "/layers.21/self_attn/q_proj/Linear/pre_reshape", "/layers.21/self_attn/q_proj/Linear/pre_convert", "/layers.21/self_attn/q_proj/Linear", "/layers.21/self_attn/q_proj/Linear/post_convert", "/layers.21/self_attn/k_proj/Linear/pre_reshape", "/layers.21/self_attn/k_proj/Linear/pre_convert", "/layers.21/self_attn/k_proj/Linear", "/layers.21/self_attn/k_proj/Linear/post_convert", "/layers.21/self_attn/v_proj/Linear/pre_reshape", "/layers.21/self_attn/v_proj/Linear/pre_convert", "/layers.21/self_attn/v_proj/Linear", "/layers.21/self_attn/v_proj/Linear/post_convert", "/layers.21/self_attn/o_proj/Linear/pre_reshape", "/layers.21/self_attn/o_proj/Linear/pre_convert", "/layers.21/self_attn/o_proj/Linear", "/layers.21/self_attn/o_proj/Linear/post_convert", "/layers.21/mlp/gate_proj/Linear/pre_reshape", "/layers.21/mlp/gate_proj/Linear/pre_convert", "/layers.21/mlp/gate_proj/Linear", "/layers.21/mlp/gate_proj/Linear/post_convert", "/layers.21/mlp/up_proj/Linear/pre_reshape", "/layers.21/mlp/up_proj/Linear/pre_convert", "/layers.21/mlp/up_proj/Linear", "/layers.21/mlp/up_proj/Linear/post_convert", "/layers.21/mlp/down_proj/Linear/pre_reshape", "/layers.21/mlp/down_proj/Linear/pre_convert", "/layers.21/mlp/down_proj/Linear", "/layers.21/mlp/down_proj/Linear/post_convert", "/layers.22/self_attn/q_proj/Linear/pre_reshape", "/layers.22/self_attn/q_proj/Linear/pre_convert", "/layers.22/self_attn/q_proj/Linear", "/layers.22/self_attn/q_proj/Linear/post_convert", "/layers.22/self_attn/k_proj/Linear/pre_reshape", "/layers.22/self_attn/k_proj/Linear/pre_convert", "/layers.22/self_attn/k_proj/Linear", "/layers.22/self_attn/k_proj/Linear/post_convert", "/layers.22/self_attn/v_proj/Linear/pre_reshape", "/layers.22/self_attn/v_proj/Linear/pre_convert", "/layers.22/self_attn/v_proj/Linear", "/layers.22/self_attn/v_proj/Linear/post_convert", "/layers.22/self_attn/o_proj/Linear/pre_reshape", "/layers.22/self_attn/o_proj/Linear/pre_convert", "/layers.22/self_attn/o_proj/Linear", "/layers.22/self_attn/o_proj/Linear/post_convert", "/layers.22/mlp/gate_proj/Linear/pre_reshape", "/layers.22/mlp/gate_proj/Linear/pre_convert", "/layers.22/mlp/gate_proj/Linear", "/layers.22/mlp/gate_proj/Linear/post_convert", "/layers.22/mlp/up_proj/Linear/pre_reshape", "/layers.22/mlp/up_proj/Linear/pre_convert", "/layers.22/mlp/up_proj/Linear", "/layers.22/mlp/up_proj/Linear/post_convert", "/layers.22/mlp/down_proj/Linear/pre_reshape", "/layers.22/mlp/down_proj/Linear/pre_convert", "/layers.22/mlp/down_proj/Linear", "/layers.22/mlp/down_proj/Linear/post_convert", "/layers.23/self_attn/q_proj/Linear/pre_reshape", "/layers.23/self_attn/q_proj/Linear/pre_convert", "/layers.23/self_attn/q_proj/Linear", "/layers.23/self_attn/q_proj/Linear/post_convert", "/layers.23/self_attn/k_proj/Linear/pre_reshape", "/layers.23/self_attn/k_proj/Linear/pre_convert", "/layers.23/self_attn/k_proj/Linear", "/layers.23/self_attn/k_proj/Linear/post_convert", "/layers.23/self_attn/v_proj/Linear/pre_reshape", "/layers.23/self_attn/v_proj/Linear/pre_convert", "/layers.23/self_attn/v_proj/Linear", "/layers.23/self_attn/v_proj/Linear/post_convert", "/layers.23/self_attn/o_proj/Linear/pre_reshape", "/layers.23/self_attn/o_proj/Linear/pre_convert", "/layers.23/self_attn/o_proj/Linear", "/layers.23/self_attn/o_proj/Linear/post_convert", "/layers.23/mlp/gate_proj/Linear/pre_reshape", "/layers.23/mlp/gate_proj/Linear/pre_convert", "/layers.23/mlp/gate_proj/Linear", "/layers.23/mlp/gate_proj/Linear/post_convert", "/layers.23/mlp/up_proj/Linear/pre_reshape", "/layers.23/mlp/up_proj/Linear/pre_convert", "/layers.23/mlp/up_proj/Linear", "/layers.23/mlp/up_proj/Linear/post_convert", "/layers.23/mlp/down_proj/Linear/pre_reshape", "/layers.23/mlp/down_proj/Linear/pre_convert", "/layers.23/mlp/down_proj/Linear", "/layers.23/mlp/down_proj/Linear/post_convert", "/layers.24/self_attn/q_proj/Linear/pre_reshape", "/layers.24/self_attn/q_proj/Linear/pre_convert", "/layers.24/self_attn/q_proj/Linear", "/layers.24/self_attn/q_proj/Linear/post_convert", "/layers.24/self_attn/k_proj/Linear/pre_reshape", "/layers.24/self_attn/k_proj/Linear/pre_convert", "/layers.24/self_attn/k_proj/Linear", "/layers.24/self_attn/k_proj/Linear/post_convert", "/layers.24/self_attn/v_proj/Linear/pre_reshape", "/layers.24/self_attn/v_proj/Linear/pre_convert", "/layers.24/self_attn/v_proj/Linear", "/layers.24/self_attn/v_proj/Linear/post_convert", "/layers.24/self_attn/o_proj/Linear/pre_reshape", "/layers.24/self_attn/o_proj/Linear/pre_convert", "/layers.24/self_attn/o_proj/Linear", "/layers.24/self_attn/o_proj/Linear/post_convert", "/layers.24/mlp/gate_proj/Linear/pre_reshape", "/layers.24/mlp/gate_proj/Linear/pre_convert", "/layers.24/mlp/gate_proj/Linear", "/layers.24/mlp/gate_proj/Linear/post_convert", "/layers.24/mlp/up_proj/Linear/pre_reshape", "/layers.24/mlp/up_proj/Linear/pre_convert", "/layers.24/mlp/up_proj/Linear", "/layers.24/mlp/up_proj/Linear/post_convert", "/layers.24/mlp/down_proj/Linear/pre_reshape", "/layers.24/mlp/down_proj/Linear/pre_convert", "/layers.24/mlp/down_proj/Linear", "/layers.24/mlp/down_proj/Linear/post_convert", "/layers.25/self_attn/q_proj/Linear/pre_reshape", "/layers.25/self_attn/q_proj/Linear/pre_convert", "/layers.25/self_attn/q_proj/Linear", "/layers.25/self_attn/q_proj/Linear/post_convert", "/layers.25/self_attn/k_proj/Linear/pre_reshape", "/layers.25/self_attn/k_proj/Linear/pre_convert", "/layers.25/self_attn/k_proj/Linear", "/layers.25/self_attn/k_proj/Linear/post_convert", "/layers.25/self_attn/v_proj/Linear/pre_reshape", "/layers.25/self_attn/v_proj/Linear/pre_convert", "/layers.25/self_attn/v_proj/Linear", "/layers.25/self_attn/v_proj/Linear/post_convert", "/layers.25/self_attn/o_proj/Linear/pre_reshape", "/layers.25/self_attn/o_proj/Linear/pre_convert", "/layers.25/self_attn/o_proj/Linear", "/layers.25/self_attn/o_proj/Linear/post_convert", "/layers.25/mlp/gate_proj/Linear/pre_reshape", "/layers.25/mlp/gate_proj/Linear/pre_convert", "/layers.25/mlp/gate_proj/Linear", "/layers.25/mlp/gate_proj/Linear/post_convert", "/layers.25/mlp/up_proj/Linear/pre_reshape", "/layers.25/mlp/up_proj/Linear/pre_convert", "/layers.25/mlp/up_proj/Linear", "/layers.25/mlp/up_proj/Linear/post_convert", "/layers.25/mlp/down_proj/Linear/pre_reshape", "/layers.25/mlp/down_proj/Linear/pre_convert", "/layers.25/mlp/down_proj/Linear", "/layers.25/mlp/down_proj/Linear/post_convert", "/layers.26/self_attn/q_proj/Linear/pre_reshape", "/layers.26/self_attn/q_proj/Linear/pre_convert", "/layers.26/self_attn/q_proj/Linear", "/layers.26/self_attn/q_proj/Linear/post_convert", "/layers.26/self_attn/k_proj/Linear/pre_reshape", "/layers.26/self_attn/k_proj/Linear/pre_convert", "/layers.26/self_attn/k_proj/Linear", "/layers.26/self_attn/k_proj/Linear/post_convert", "/layers.26/self_attn/v_proj/Linear/pre_reshape", "/layers.26/self_attn/v_proj/Linear/pre_convert", "/layers.26/self_attn/v_proj/Linear", "/layers.26/self_attn/v_proj/Linear/post_convert", "/layers.26/self_attn/o_proj/Linear/pre_reshape", "/layers.26/self_attn/o_proj/Linear/pre_convert", "/layers.26/self_attn/o_proj/Linear", "/layers.26/self_attn/o_proj/Linear/post_convert", "/layers.26/mlp/gate_proj/Linear/pre_reshape", "/layers.26/mlp/gate_proj/Linear/pre_convert", "/layers.26/mlp/gate_proj/Linear", "/layers.26/mlp/gate_proj/Linear/post_convert", "/layers.26/mlp/up_proj/Linear/pre_reshape", "/layers.26/mlp/up_proj/Linear/pre_convert", "/layers.26/mlp/up_proj/Linear", "/layers.26/mlp/up_proj/Linear/post_convert", "/layers.26/mlp/down_proj/Linear/pre_reshape", "/layers.26/mlp/down_proj/Linear/pre_convert", "/layers.26/mlp/down_proj/Linear", "/layers.26/mlp/down_proj/Linear/post_convert", "/layers.27/self_attn/q_proj/Linear/pre_reshape", "/layers.27/self_attn/q_proj/Linear/pre_convert", "/layers.27/self_attn/q_proj/Linear", "/layers.27/self_attn/q_proj/Linear/post_convert", "/layers.27/self_attn/k_proj/Linear/pre_reshape", "/layers.27/self_attn/k_proj/Linear/pre_convert", "/layers.27/self_attn/k_proj/Linear", "/layers.27/self_attn/k_proj/Linear/post_convert", "/layers.27/self_attn/v_proj/Linear/pre_reshape", "/layers.27/self_attn/v_proj/Linear/pre_convert", "/layers.27/self_attn/v_proj/Linear", "/layers.27/self_attn/v_proj/Linear/post_convert", "/layers.27/self_attn/o_proj/Linear/pre_reshape", "/layers.27/self_attn/o_proj/Linear/pre_convert", "/layers.27/self_attn/o_proj/Linear", "/layers.27/self_attn/o_proj/Linear/post_convert", "/layers.27/mlp/gate_proj/Linear/pre_reshape", "/layers.27/mlp/gate_proj/Linear/pre_convert", "/layers.27/mlp/gate_proj/Linear", "/layers.27/mlp/gate_proj/Linear/post_convert", "/layers.27/mlp/up_proj/Linear/pre_reshape", "/layers.27/mlp/up_proj/Linear/pre_convert", "/layers.27/mlp/up_proj/Linear", "/layers.27/mlp/up_proj/Linear/post_convert", "/layers.27/mlp/down_proj/Linear/pre_reshape", "/layers.27/mlp/down_proj/Linear/pre_convert", "/layers.27/mlp/down_proj/Linear", "/layers.27/mlp/down_proj/Linear/post_convert", "/layers.28/self_attn/q_proj/Linear/pre_reshape", "/layers.28/self_attn/q_proj/Linear/pre_convert", "/layers.28/self_attn/q_proj/Linear", "/layers.28/self_attn/q_proj/Linear/post_convert", "/layers.28/self_attn/k_proj/Linear/pre_reshape", "/layers.28/self_attn/k_proj/Linear/pre_convert", "/layers.28/self_attn/k_proj/Linear", "/layers.28/self_attn/k_proj/Linear/post_convert", "/layers.28/self_attn/v_proj/Linear/pre_reshape", "/layers.28/self_attn/v_proj/Linear/pre_convert", "/layers.28/self_attn/v_proj/Linear", "/layers.28/self_attn/v_proj/Linear/post_convert", "/layers.28/self_attn/o_proj/Linear/pre_reshape", "/layers.28/self_attn/o_proj/Linear/pre_convert", "/layers.28/self_attn/o_proj/Linear", "/layers.28/self_attn/o_proj/Linear/post_convert", "/layers.28/mlp/gate_proj/Linear/pre_reshape", "/layers.28/mlp/gate_proj/Linear/pre_convert", "/layers.28/mlp/gate_proj/Linear", "/layers.28/mlp/gate_proj/Linear/post_convert", "/layers.28/mlp/up_proj/Linear/pre_reshape", "/layers.28/mlp/up_proj/Linear/pre_convert", "/layers.28/mlp/up_proj/Linear", "/layers.28/mlp/up_proj/Linear/post_convert", "/layers.28/mlp/down_proj/Linear/pre_reshape", "/layers.28/mlp/down_proj/Linear/pre_convert", "/layers.28/mlp/down_proj/Linear", "/layers.28/mlp/down_proj/Linear/post_convert", "/layers.29/self_attn/q_proj/Linear/pre_reshape", "/layers.29/self_attn/q_proj/Linear/pre_convert", "/layers.29/self_attn/q_proj/Linear", "/layers.29/self_attn/q_proj/Linear/post_convert", "/layers.29/self_attn/k_proj/Linear/pre_reshape", "/layers.29/self_attn/k_proj/Linear/pre_convert", "/layers.29/self_attn/k_proj/Linear", "/layers.29/self_attn/k_proj/Linear/post_convert", "/layers.29/self_attn/v_proj/Linear/pre_reshape", "/layers.29/self_attn/v_proj/Linear/pre_convert", "/layers.29/self_attn/v_proj/Linear", "/layers.29/self_attn/v_proj/Linear/post_convert", "/layers.29/self_attn/o_proj/Linear/pre_reshape", "/layers.29/self_attn/o_proj/Linear/pre_convert", "/layers.29/self_attn/o_proj/Linear", "/layers.29/self_attn/o_proj/Linear/post_convert", "/layers.29/mlp/gate_proj/Linear/pre_reshape", "/layers.29/mlp/gate_proj/Linear/pre_convert", "/layers.29/mlp/gate_proj/Linear", "/layers.29/mlp/gate_proj/Linear/post_convert", "/layers.29/mlp/up_proj/Linear/pre_reshape", "/layers.29/mlp/up_proj/Linear/pre_convert", "/layers.29/mlp/up_proj/Linear", "/layers.29/mlp/up_proj/Linear/post_convert", "/layers.29/mlp/down_proj/Linear/pre_reshape", "/layers.29/mlp/down_proj/Linear/pre_convert", "/layers.29/mlp/down_proj/Linear", "/layers.29/mlp/down_proj/Linear/post_convert", "/layers.30/self_attn/q_proj/Linear/pre_reshape", "/layers.30/self_attn/q_proj/Linear/pre_convert", "/layers.30/self_attn/q_proj/Linear", "/layers.30/self_attn/q_proj/Linear/post_convert", "/layers.30/self_attn/k_proj/Linear/pre_reshape", "/layers.30/self_attn/k_proj/Linear/pre_convert", "/layers.30/self_attn/k_proj/Linear", "/layers.30/self_attn/k_proj/Linear/post_convert", "/layers.30/self_attn/v_proj/Linear/pre_reshape", "/layers.30/self_attn/v_proj/Linear/pre_convert", "/layers.30/self_attn/v_proj/Linear", "/layers.30/self_attn/v_proj/Linear/post_convert", "/layers.30/self_attn/o_proj/Linear/pre_reshape", "/layers.30/self_attn/o_proj/Linear/pre_convert", "/layers.30/self_attn/o_proj/Linear", "/layers.30/self_attn/o_proj/Linear/post_convert", "/layers.30/mlp/gate_proj/Linear/pre_reshape", "/layers.30/mlp/gate_proj/Linear/pre_convert", "/layers.30/mlp/gate_proj/Linear", "/layers.30/mlp/gate_proj/Linear/post_convert", "/layers.30/mlp/up_proj/Linear/pre_reshape", "/layers.30/mlp/up_proj/Linear/pre_convert", "/layers.30/mlp/up_proj/Linear", "/layers.30/mlp/up_proj/Linear/post_convert", "/layers.30/mlp/down_proj/Linear/pre_reshape", "/layers.30/mlp/down_proj/Linear/pre_convert", "/layers.30/mlp/down_proj/Linear", "/layers.30/mlp/down_proj/Linear/post_convert", "/layers.31/self_attn/q_proj/Linear/pre_reshape", "/layers.31/self_attn/q_proj/Linear/pre_convert", "/layers.31/self_attn/q_proj/Linear", "/layers.31/self_attn/q_proj/Linear/post_convert", "/layers.31/self_attn/k_proj/Linear/pre_reshape", "/layers.31/self_attn/k_proj/Linear/pre_convert", "/layers.31/self_attn/k_proj/Linear", "/layers.31/self_attn/k_proj/Linear/post_convert", "/layers.31/self_attn/v_proj/Linear/pre_reshape", "/layers.31/self_attn/v_proj/Linear/pre_convert", "/layers.31/self_attn/v_proj/Linear", "/layers.31/self_attn/v_proj/Linear/post_convert", "/layers.31/self_attn/o_proj/Linear/pre_reshape", "/layers.31/self_attn/o_proj/Linear/pre_convert", "/layers.31/self_attn/o_proj/Linear", "/layers.31/self_attn/o_proj/Linear/post_convert", "/layers.31/mlp/gate_proj/Linear/pre_reshape", "/layers.31/mlp/gate_proj/Linear/pre_convert", "/layers.31/mlp/gate_proj/Linear", "/layers.31/mlp/gate_proj/Linear/post_convert", "/layers.31/mlp/up_proj/Linear/pre_reshape", "/layers.31/mlp/up_proj/Linear/pre_convert", "/layers.31/mlp/up_proj/Linear", "/layers.31/mlp/up_proj/Linear/post_convert", "/layers.31/mlp/down_proj/Linear/pre_reshape", "/layers.31/mlp/down_proj/Linear/pre_convert", "/layers.31/mlp/down_proj/Linear", "/layers.31/mlp/down_proj/Linear/post_convert", "/lm/lm_head/Linear/pre_reshape", "/lm/lm_head/Linear/pre_convert", "/lm/lm_head/Linear", "/lm/lm_head/Linear/post_convert" ] +, "tensorNumber": 0, "usage": "INFERENCE", "mnn_uuid": "b5d3c965-61d1-4789-976f-2af4a7ee5170" }