{ "bizCode": "MNNTest", "extraInfo": { "version": "3.4.0" } , "oplists": [ { "main_type": "Input", "main": { "dims": [ 1, 1, 4096 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "input_ids", "outputIndexes": [ 2 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, 1, -1, -1 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "attention_mask", "outputIndexes": [ 124 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, -1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "position_ids", "outputIndexes": [ 0 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "logits_index", "outputIndexes": [ 1 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 3 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1, -1, 4096 ] } , "name": "/blocks.0/Constant_output_0", "outputIndexes": [ 3 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/Reshape_output_0", "outputIndexes": [ 4 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 0, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.0/input_layernorm/Mul_1_output_0", "outputIndexes": [ 5 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 5 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2897 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2897 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2898 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2898 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 32768, 8388630, 1048576, 0, 0 ] } , "name": "/layers.0/self_attn/q_proj/Linear", "outputIndexes": [ 2899 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2899 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2900 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2900 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 6 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 5 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_output_0", "outputIndexes": [ 7 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 7 ] , "main_type": "NONE", "name": "Shape21", "outputIndexes": [ 8 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 7 ] , "main_type": "NONE", "name": "Rank23", "outputIndexes": [ 9 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 9, 9 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp25", "outputIndexes": [ 10 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze26", "outputIndexes": [ 11 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Const27", "outputIndexes": [ 12 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp28", "outputIndexes": [ 13 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 13 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze29", "outputIndexes": [ 14 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Unsqueeze31", "outputIndexes": [ 15 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 8, 11, 14, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice32", "outputIndexes": [ 16 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 16 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze33", "outputIndexes": [ 17 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 17, 17 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp35", "outputIndexes": [ 18 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7, 18, 10 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_output_0", "outputIndexes": [ 19 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 0 ] } , "name": "/rotary/Constant_3_output_0", "outputIndexes": [ 20 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_output_0", "outputIndexes": [ 21 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze45", "outputIndexes": [ 22 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 13 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze48", "outputIndexes": [ 23 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 8, 22, 23, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice51", "outputIndexes": [ 24 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 24 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze52", "outputIndexes": [ 25 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 25 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp53", "outputIndexes": [ 26 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 26, 25 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp54", "outputIndexes": [ 27 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7, 27, 10 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_1_output_0", "outputIndexes": [ 28 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 29 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 32 ] } , "name": "/blocks.0/self_attn/Constant_2_output_0", "outputIndexes": [ 30 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 128 ] } , "name": "/blocks.0/self_attn/Constant_3_output_0", "outputIndexes": [ 31 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 29, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_output_0", "outputIndexes": [ 32 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 6, 32 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_output_0", "outputIndexes": [ 33 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 0 ] , "main_type": "CastParam", "main": { "srcT": "DT_VARIANT", "dstT": "DT_FLOAT" } , "name": "/rotary/Cast_output_0", "outputIndexes": [ 34 ] , "type": "Cast", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 2 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ -1, 1 ] } , "name": "/rotary/Constant_output_0", "outputIndexes": [ 35 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 34, 35 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/rotary/Reshape_output_0", "outputIndexes": [ 36 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 64 ] , "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": [ 1.0, 0.814617, 0.663601, 0.540581, 0.440367, 0.35873, 0.292228, 0.238054, 0.193923, 0.157973, 0.128687, 0.104831, 0.085397, 0.069566, 0.05667, 0.046164, 0.037606, 0.030635, 0.024955, 0.020329, 0.01656, 0.01349, 0.01099, 0.008952, 0.007293, 0.005941, 0.004839, 0.003942, 0.003211, 0.002616, 0.002131, 0.001736, 0.001414, 0.001152, 0.000938, 0.000764, 0.000623, 0.000507, 0.000413, 0.000337, 0.000274, 0.000223, 0.000182, 0.000148, 0.000121, 0.000098, 0.00008, 0.000065, 0.000053, 0.000043, 0.000035, 0.000029, 0.000023, 0.000019, 0.000016, 0.000013, 0.00001, 0.000008, 0.000007, 0.000006, 0.000005, 0.000004, 0.000003, 0.000002 ] } , "name": "/rotary/Constant_1_output_0", "outputIndexes": [ 37 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 36, 37 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/rotary/Mul_output_0", "outputIndexes": [ 38 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 38 ] , "main_type": "UnaryOp", "main": { "opType": "COS", "T": "DT_FLOAT" } , "name": "/rotary/Cos_output_0", "outputIndexes": [ 39 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 39, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_output_0", "outputIndexes": [ 40 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 38 ] , "main_type": "UnaryOp", "main": { "opType": "SIN", "T": "DT_FLOAT" } , "name": "/rotary/Sin_output_0", "outputIndexes": [ 41 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 41, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_1_output_0", "outputIndexes": [ 42 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40, 42 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/rotary/Concat_output_0", "outputIndexes": [ 43 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 43, 43 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/rotary/Concat_1_output_0", "outputIndexes": [ 44 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/rotary/Constant_5_output_0", "outputIndexes": [ 45 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 44, 45 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_2_output_0", "outputIndexes": [ 46 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 46, 15 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_3_output_0", "outputIndexes": [ 47 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 47 ] , "main_type": "NONE", "name": "Shape76", "outputIndexes": [ 48 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 47 ] , "main_type": "NONE", "name": "Rank78", "outputIndexes": [ 49 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 49, 49 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp80", "outputIndexes": [ 50 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 50 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze81", "outputIndexes": [ 51 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 50, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp83", "outputIndexes": [ 52 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 52 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze84", "outputIndexes": [ 53 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 48, 51, 53, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice87", "outputIndexes": [ 54 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 54 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze88", "outputIndexes": [ 55 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 55, 55 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp90", "outputIndexes": [ 56 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 47, 56, 50 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_2_output_0", "outputIndexes": [ 57 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 33, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_output_0", "outputIndexes": [ 58 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 33 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_2_output_0", "outputIndexes": [ 59 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/blocks.0/self_attn/Constant_8_output_0", "outputIndexes": [ 60 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 59 ] , "main_type": "NONE", "name": "Shape95", "outputIndexes": [ 61 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 59 ] , "main_type": "NONE", "name": "Rank97", "outputIndexes": [ 62 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 62 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp99", "outputIndexes": [ 63 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 63 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze100", "outputIndexes": [ 64 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 63, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp102", "outputIndexes": [ 65 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 65 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze103", "outputIndexes": [ 66 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 64, 66, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice106", "outputIndexes": [ 67 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 67 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze107", "outputIndexes": [ 68 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 68 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp108", "outputIndexes": [ 69 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 69, 68 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp109", "outputIndexes": [ 70 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 59, 70, 63 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_4_output_0", "outputIndexes": [ 71 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/blocks.0/self_attn/Constant_9_output_0", "outputIndexes": [ 72 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 71, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Div_output_0", "outputIndexes": [ 73 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 73, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 74 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1073741824 ] } , "name": "/blocks.0/self_attn/Constant_16_output_0", "outputIndexes": [ 75 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/blocks.0/self_attn/Constant_10_output_0", "outputIndexes": [ 76 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 33, 74, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_1_output_0", "outputIndexes": [ 77 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 77 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.0/self_attn/Neg_output_0", "outputIndexes": [ 78 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 73, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 79 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 33, 20, 79, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_output_0", "outputIndexes": [ 80 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 78, 80 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.0/self_attn/Concat_3_output_0", "outputIndexes": [ 81 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 50 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze127", "outputIndexes": [ 82 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 52 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze130", "outputIndexes": [ 83 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 48, 82, 83, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice133", "outputIndexes": [ 84 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 84 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze134", "outputIndexes": [ 85 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 85 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp135", "outputIndexes": [ 86 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 86, 85 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp136", "outputIndexes": [ 87 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 47, 87, 50 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_3_output_0", "outputIndexes": [ 88 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 81, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_1_output_0", "outputIndexes": [ 89 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 58, 89 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Add_output_0", "outputIndexes": [ 90 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2898 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 9469974, 2097174, 262144, 0, 0 ] } , "name": "/layers.0/self_attn/k_proj/Linear", "outputIndexes": [ 2903 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2903 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2904 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2904 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 91 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 92 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 93 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 8 ] } , "name": "/blocks.0/self_attn/Constant_4_output_0", "outputIndexes": [ 94 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 92, 93, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_1_output_0", "outputIndexes": [ 95 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 91, 95 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_1_output_0", "outputIndexes": [ 96 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 96, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_2_output_0", "outputIndexes": [ 97 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 96 ] , "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_3_output_0", "outputIndexes": [ 98 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 98 ] , "main_type": "NONE", "name": "Shape148", "outputIndexes": [ 99 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 98 ] , "main_type": "NONE", "name": "Rank150", "outputIndexes": [ 100 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 100, 100 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp152", "outputIndexes": [ 101 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 101 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze153", "outputIndexes": [ 102 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 101, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp155", "outputIndexes": [ 103 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 103 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze156", "outputIndexes": [ 104 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 99, 102, 104, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice159", "outputIndexes": [ 105 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 105 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze160", "outputIndexes": [ 106 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 106 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp161", "outputIndexes": [ 107 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 107, 106 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp162", "outputIndexes": [ 108 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 98, 108, 101 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.0/self_attn/Gather_5_output_0", "outputIndexes": [ 109 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 109, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Div_1_output_0", "outputIndexes": [ 110 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 110, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 111 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 96, 111, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_3_output_0", "outputIndexes": [ 112 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 112 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.0/self_attn/Neg_1_output_0", "outputIndexes": [ 113 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 110, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 114 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 96, 20, 114, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.0/self_attn/Slice_2_output_0", "outputIndexes": [ 115 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 113, 115 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.0/self_attn/Concat_4_output_0", "outputIndexes": [ 116 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 116, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Mul_3_output_0", "outputIndexes": [ 117 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 97, 117 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/self_attn/Add_1_output_0", "outputIndexes": [ 118 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2898 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 11829292, 2097174, 262144, 0, 0 ] } , "name": "/layers.0/self_attn/v_proj/Linear", "outputIndexes": [ 2907 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2907 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2908 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2908 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 119 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 120 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.0/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 121 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 120, 121, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.0/self_attn/Concat_2_output_0", "outputIndexes": [ 122 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 119, 122 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.0/self_attn/Reshape_2_output_0", "outputIndexes": [ 123 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 90, 118, 123, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.0/self_attn/FusedAttention", "outputIndexes": [ 125 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 125 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2909 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2909 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2910 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2910 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 14188610, 8388630, 1048576, 0, 0 ] } , "name": "/layers.0/self_attn/o_proj/Linear", "outputIndexes": [ 2911 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2911 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2912 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2912 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 126 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4, 126 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/Add_output_0", "outputIndexes": [ 127 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 127 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 23625816, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.0/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 128 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 128 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2913 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2913 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2914 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2914 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 23658584, 29360150, 3670016, 0, 0 ] } , "name": "/layers.0/mlp/gate_proj/Linear", "outputIndexes": [ 2915 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2915 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2916 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2916 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 129 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 129 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.0/mlp/act_fn/Mul_output_0", "outputIndexes": [ 130 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2914 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 56688750, 29360150, 3670016, 0, 0 ] } , "name": "/layers.0/mlp/up_proj/Linear", "outputIndexes": [ 2919 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2919 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2920 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2920 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 131 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 130, 131 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/mlp/Mul_output_0", "outputIndexes": [ 132 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 132 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2921 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2921 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2922 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2922 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 89718916, 29360150, 3670016, 0, 0 ] } , "name": "/layers.0/mlp/down_proj/Linear", "outputIndexes": [ 2923 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2923 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2924 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2924 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 133 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 127, 133 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.0/Add_1_output_0", "outputIndexes": [ 134 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 134, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/Reshape_output_0", "outputIndexes": [ 135 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 135 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 122749082, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.1/input_layernorm/Mul_1_output_0", "outputIndexes": [ 136 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 136 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2925 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2925 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2926 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2926 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 122781850, 8388630, 1048576, 0, 0 ] } , "name": "/layers.1/self_attn/q_proj/Linear", "outputIndexes": [ 2927 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2927 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2928 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2928 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 137 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 136 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_output_0", "outputIndexes": [ 138 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 138 ] , "main_type": "NONE", "name": "Shape209", "outputIndexes": [ 139 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 138 ] , "main_type": "NONE", "name": "Rank211", "outputIndexes": [ 140 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 140, 140 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp213", "outputIndexes": [ 141 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 141 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze214", "outputIndexes": [ 142 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 141, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp216", "outputIndexes": [ 143 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze217", "outputIndexes": [ 144 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 139, 142, 144, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice220", "outputIndexes": [ 145 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 145 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze221", "outputIndexes": [ 146 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 146, 146 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp223", "outputIndexes": [ 147 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 138, 147, 141 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_output_0", "outputIndexes": [ 148 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 148, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_output_0", "outputIndexes": [ 149 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 141 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze231", "outputIndexes": [ 150 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze234", "outputIndexes": [ 151 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 139, 150, 151, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice237", "outputIndexes": [ 152 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 152 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze238", "outputIndexes": [ 153 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 153 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp239", "outputIndexes": [ 154 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 154, 153 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp240", "outputIndexes": [ 155 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 138, 155, 141 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_1_output_0", "outputIndexes": [ 156 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 157 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 149, 157, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_output_0", "outputIndexes": [ 158 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 137, 158 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_output_0", "outputIndexes": [ 159 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 159, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_output_0", "outputIndexes": [ 160 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 159 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_2_output_0", "outputIndexes": [ 161 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 161 ] , "main_type": "NONE", "name": "Shape247", "outputIndexes": [ 162 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 161 ] , "main_type": "NONE", "name": "Rank249", "outputIndexes": [ 163 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 163, 163 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp251", "outputIndexes": [ 164 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 164 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze252", "outputIndexes": [ 165 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 164, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp254", "outputIndexes": [ 166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 166 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze255", "outputIndexes": [ 167 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 162, 165, 167, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice258", "outputIndexes": [ 168 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 168 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze259", "outputIndexes": [ 169 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 169 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp260", "outputIndexes": [ 170 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 170, 169 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp261", "outputIndexes": [ 171 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 161, 171, 164 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_2_output_0", "outputIndexes": [ 172 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 172, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Div_output_0", "outputIndexes": [ 173 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 173, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 174 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 159, 174, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_1_output_0", "outputIndexes": [ 175 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 175 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.1/self_attn/Neg_output_0", "outputIndexes": [ 176 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 173, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 177 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 159, 20, 177, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_output_0", "outputIndexes": [ 178 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 176, 178 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.1/self_attn/Concat_3_output_0", "outputIndexes": [ 179 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 179, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_1_output_0", "outputIndexes": [ 180 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 160, 180 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Add_output_0", "outputIndexes": [ 181 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2926 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 132219056, 2097174, 262144, 0, 0 ] } , "name": "/layers.1/self_attn/k_proj/Linear", "outputIndexes": [ 2931 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2931 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2932 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2932 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 182 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 148, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 183 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 184 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 183, 184, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_1_output_0", "outputIndexes": [ 185 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 182, 185 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_1_output_0", "outputIndexes": [ 186 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_2_output_0", "outputIndexes": [ 187 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186 ] , "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_3_output_0", "outputIndexes": [ 188 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 188 ] , "main_type": "NONE", "name": "Shape280", "outputIndexes": [ 189 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 188 ] , "main_type": "NONE", "name": "Rank282", "outputIndexes": [ 190 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 190, 190 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp284", "outputIndexes": [ 191 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 191 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze285", "outputIndexes": [ 192 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 191, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp287", "outputIndexes": [ 193 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 193 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze288", "outputIndexes": [ 194 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 189, 192, 194, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice291", "outputIndexes": [ 195 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 195 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze292", "outputIndexes": [ 196 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 196 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp293", "outputIndexes": [ 197 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 197, 196 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp294", "outputIndexes": [ 198 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188, 198, 191 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.1/self_attn/Gather_3_output_0", "outputIndexes": [ 199 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 199, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Div_1_output_0", "outputIndexes": [ 200 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 200, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 201 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186, 201, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_3_output_0", "outputIndexes": [ 202 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 202 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.1/self_attn/Neg_1_output_0", "outputIndexes": [ 203 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 200, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 204 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186, 20, 204, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.1/self_attn/Slice_2_output_0", "outputIndexes": [ 205 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 203, 205 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.1/self_attn/Concat_4_output_0", "outputIndexes": [ 206 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 206, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Mul_3_output_0", "outputIndexes": [ 207 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 187, 207 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/self_attn/Add_1_output_0", "outputIndexes": [ 208 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2926 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 134578374, 2097174, 262144, 0, 0 ] } , "name": "/layers.1/self_attn/v_proj/Linear", "outputIndexes": [ 2935 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2935 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2936 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2936 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 209 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 148, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 210 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.1/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 211 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 210, 211, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.1/self_attn/Concat_2_output_0", "outputIndexes": [ 212 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 209, 212 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.1/self_attn/Reshape_2_output_0", "outputIndexes": [ 213 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 181, 208, 213, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.1/self_attn/FusedAttention", "outputIndexes": [ 214 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 214 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2937 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2937 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2938 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2938 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 136937692, 8388630, 1048576, 0, 0 ] } , "name": "/layers.1/self_attn/o_proj/Linear", "outputIndexes": [ 2939 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2939 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2940 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2940 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 215 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 135, 215 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/Add_output_0", "outputIndexes": [ 216 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 216 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 146374898, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.1/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 217 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 217 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2941 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2941 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2942 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2942 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 146407666, 29360150, 3670016, 0, 0 ] } , "name": "/layers.1/mlp/gate_proj/Linear", "outputIndexes": [ 2943 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2943 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2944 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2944 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 218 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 218 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.1/mlp/act_fn/Mul_output_0", "outputIndexes": [ 219 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2942 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 179437832, 29360150, 3670016, 0, 0 ] } , "name": "/layers.1/mlp/up_proj/Linear", "outputIndexes": [ 2947 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2947 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2948 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2948 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 220 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 219, 220 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/mlp/Mul_output_0", "outputIndexes": [ 221 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 221 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2949 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2949 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2950 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2950 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 212467998, 29360150, 3670016, 0, 0 ] } , "name": "/layers.1/mlp/down_proj/Linear", "outputIndexes": [ 2951 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2951 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2952 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2952 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 222 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 216, 222 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.1/Add_1_output_0", "outputIndexes": [ 223 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 223, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/Reshape_output_0", "outputIndexes": [ 224 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 224 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 245498164, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.2/input_layernorm/Mul_1_output_0", "outputIndexes": [ 225 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 225 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2953 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2953 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2954 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2954 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 245530932, 8388630, 1048576, 0, 0 ] } , "name": "/layers.2/self_attn/q_proj/Linear", "outputIndexes": [ 2955 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2955 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2956 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2956 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 226 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 225 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_output_0", "outputIndexes": [ 227 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 227 ] , "main_type": "NONE", "name": "Shape340", "outputIndexes": [ 228 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 227 ] , "main_type": "NONE", "name": "Rank342", "outputIndexes": [ 229 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 229, 229 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp344", "outputIndexes": [ 230 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 230 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze345", "outputIndexes": [ 231 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 230, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp347", "outputIndexes": [ 232 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 232 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze348", "outputIndexes": [ 233 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 228, 231, 233, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice351", "outputIndexes": [ 234 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 234 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze352", "outputIndexes": [ 235 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 235, 235 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp354", "outputIndexes": [ 236 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 227, 236, 230 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_output_0", "outputIndexes": [ 237 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_output_0", "outputIndexes": [ 238 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 230 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze362", "outputIndexes": [ 239 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 232 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze365", "outputIndexes": [ 240 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 228, 239, 240, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice368", "outputIndexes": [ 241 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 241 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze369", "outputIndexes": [ 242 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 242 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp370", "outputIndexes": [ 243 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 243, 242 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp371", "outputIndexes": [ 244 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 227, 244, 230 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_1_output_0", "outputIndexes": [ 245 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 245, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 246 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 238, 246, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_output_0", "outputIndexes": [ 247 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 226, 247 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_output_0", "outputIndexes": [ 248 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 248, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_output_0", "outputIndexes": [ 249 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 248 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_2_output_0", "outputIndexes": [ 250 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 250 ] , "main_type": "NONE", "name": "Shape378", "outputIndexes": [ 251 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 250 ] , "main_type": "NONE", "name": "Rank380", "outputIndexes": [ 252 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 252, 252 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp382", "outputIndexes": [ 253 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze383", "outputIndexes": [ 254 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp385", "outputIndexes": [ 255 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 255 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze386", "outputIndexes": [ 256 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 251, 254, 256, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice389", "outputIndexes": [ 257 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 257 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze390", "outputIndexes": [ 258 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 258 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp391", "outputIndexes": [ 259 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 259, 258 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp392", "outputIndexes": [ 260 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 250, 260, 253 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_2_output_0", "outputIndexes": [ 261 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 261, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Div_output_0", "outputIndexes": [ 262 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 262, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 263 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 248, 263, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_1_output_0", "outputIndexes": [ 264 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 264 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.2/self_attn/Neg_output_0", "outputIndexes": [ 265 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 262, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 266 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 248, 20, 266, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_output_0", "outputIndexes": [ 267 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 265, 267 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.2/self_attn/Concat_3_output_0", "outputIndexes": [ 268 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 268, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_1_output_0", "outputIndexes": [ 269 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 249, 269 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Add_output_0", "outputIndexes": [ 270 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2954 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 254968138, 2097174, 262144, 0, 0 ] } , "name": "/layers.2/self_attn/k_proj/Linear", "outputIndexes": [ 2959 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2959 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2960 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2960 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 271 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 272 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 245, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 273 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 272, 273, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_1_output_0", "outputIndexes": [ 274 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 271, 274 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_1_output_0", "outputIndexes": [ 275 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_2_output_0", "outputIndexes": [ 276 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275 ] , "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_3_output_0", "outputIndexes": [ 277 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 277 ] , "main_type": "NONE", "name": "Shape411", "outputIndexes": [ 278 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 277 ] , "main_type": "NONE", "name": "Rank413", "outputIndexes": [ 279 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 279, 279 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp415", "outputIndexes": [ 280 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 280 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze416", "outputIndexes": [ 281 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 280, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp418", "outputIndexes": [ 282 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 282 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze419", "outputIndexes": [ 283 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 278, 281, 283, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice422", "outputIndexes": [ 284 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 284 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze423", "outputIndexes": [ 285 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 285 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp424", "outputIndexes": [ 286 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 286, 285 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp425", "outputIndexes": [ 287 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 277, 287, 280 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.2/self_attn/Gather_3_output_0", "outputIndexes": [ 288 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 288, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Div_1_output_0", "outputIndexes": [ 289 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 289, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 290 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275, 290, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_3_output_0", "outputIndexes": [ 291 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 291 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.2/self_attn/Neg_1_output_0", "outputIndexes": [ 292 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 289, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 293 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275, 20, 293, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.2/self_attn/Slice_2_output_0", "outputIndexes": [ 294 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 292, 294 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.2/self_attn/Concat_4_output_0", "outputIndexes": [ 295 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 295, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Mul_3_output_0", "outputIndexes": [ 296 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 276, 296 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/self_attn/Add_1_output_0", "outputIndexes": [ 297 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2954 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 257327456, 2097174, 262144, 0, 0 ] } , "name": "/layers.2/self_attn/v_proj/Linear", "outputIndexes": [ 2963 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2963 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2964 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2964 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 298 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 299 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 245, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.2/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 300 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 299, 300, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.2/self_attn/Concat_2_output_0", "outputIndexes": [ 301 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 298, 301 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.2/self_attn/Reshape_2_output_0", "outputIndexes": [ 302 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 270, 297, 302, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.2/self_attn/FusedAttention", "outputIndexes": [ 303 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 303 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2965 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2965 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2966 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2966 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 259686774, 8388630, 1048576, 0, 0 ] } , "name": "/layers.2/self_attn/o_proj/Linear", "outputIndexes": [ 2967 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2967 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2968 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2968 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 304 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 224, 304 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/Add_output_0", "outputIndexes": [ 305 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 305 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 269123980, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.2/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 306 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 306 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2969 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2969 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2970 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2970 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 269156748, 29360150, 3670016, 0, 0 ] } , "name": "/layers.2/mlp/gate_proj/Linear", "outputIndexes": [ 2971 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2971 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2972 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2972 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 307 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 307 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.2/mlp/act_fn/Mul_output_0", "outputIndexes": [ 308 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2970 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 302186914, 29360150, 3670016, 0, 0 ] } , "name": "/layers.2/mlp/up_proj/Linear", "outputIndexes": [ 2975 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2975 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2976 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2976 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 309 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 308, 309 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/mlp/Mul_output_0", "outputIndexes": [ 310 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 310 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2977 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2977 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2978 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2978 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 335217080, 29360150, 3670016, 0, 0 ] } , "name": "/layers.2/mlp/down_proj/Linear", "outputIndexes": [ 2979 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2979 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2980 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2980 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 311 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 305, 311 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.2/Add_1_output_0", "outputIndexes": [ 312 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 312, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/Reshape_output_0", "outputIndexes": [ 313 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 313 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 368247246, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.3/input_layernorm/Mul_1_output_0", "outputIndexes": [ 314 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 314 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2981 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2981 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2982 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2982 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 368280014, 8388630, 1048576, 0, 0 ] } , "name": "/layers.3/self_attn/q_proj/Linear", "outputIndexes": [ 2983 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2983 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2984 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2984 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 315 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 314 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_output_0", "outputIndexes": [ 316 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 316 ] , "main_type": "NONE", "name": "Shape471", "outputIndexes": [ 317 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 316 ] , "main_type": "NONE", "name": "Rank473", "outputIndexes": [ 318 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 318, 318 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp475", "outputIndexes": [ 319 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 319 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze476", "outputIndexes": [ 320 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 319, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp478", "outputIndexes": [ 321 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 321 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze479", "outputIndexes": [ 322 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317, 320, 322, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice482", "outputIndexes": [ 323 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 323 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze483", "outputIndexes": [ 324 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 324, 324 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp485", "outputIndexes": [ 325 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 316, 325, 319 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_output_0", "outputIndexes": [ 326 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_output_0", "outputIndexes": [ 327 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 319 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze493", "outputIndexes": [ 328 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 321 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze496", "outputIndexes": [ 329 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317, 328, 329, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice499", "outputIndexes": [ 330 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 330 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze500", "outputIndexes": [ 331 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 331 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp501", "outputIndexes": [ 332 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 332, 331 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp502", "outputIndexes": [ 333 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 316, 333, 319 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_1_output_0", "outputIndexes": [ 334 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 334, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 335 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 327, 335, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_output_0", "outputIndexes": [ 336 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 315, 336 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_output_0", "outputIndexes": [ 337 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 337, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_output_0", "outputIndexes": [ 338 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 337 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_2_output_0", "outputIndexes": [ 339 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 339 ] , "main_type": "NONE", "name": "Shape509", "outputIndexes": [ 340 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 339 ] , "main_type": "NONE", "name": "Rank511", "outputIndexes": [ 341 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 341, 341 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp513", "outputIndexes": [ 342 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 342 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze514", "outputIndexes": [ 343 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 342, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp516", "outputIndexes": [ 344 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 344 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze517", "outputIndexes": [ 345 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 340, 343, 345, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice520", "outputIndexes": [ 346 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 346 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze521", "outputIndexes": [ 347 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 347 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp522", "outputIndexes": [ 348 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 348, 347 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp523", "outputIndexes": [ 349 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 339, 349, 342 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_2_output_0", "outputIndexes": [ 350 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 350, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Div_output_0", "outputIndexes": [ 351 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 351, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 352 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 337, 352, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_1_output_0", "outputIndexes": [ 353 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 353 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.3/self_attn/Neg_output_0", "outputIndexes": [ 354 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 351, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 355 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 337, 20, 355, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_output_0", "outputIndexes": [ 356 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 354, 356 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.3/self_attn/Concat_3_output_0", "outputIndexes": [ 357 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 357, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_1_output_0", "outputIndexes": [ 358 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 338, 358 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Add_output_0", "outputIndexes": [ 359 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2982 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 377717220, 2097174, 262144, 0, 0 ] } , "name": "/layers.3/self_attn/k_proj/Linear", "outputIndexes": [ 2987 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2987 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2988 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2988 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 360 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 361 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 334, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 362 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 361, 362, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_1_output_0", "outputIndexes": [ 363 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 360, 363 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_1_output_0", "outputIndexes": [ 364 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 364, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_2_output_0", "outputIndexes": [ 365 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 364 ] , "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_3_output_0", "outputIndexes": [ 366 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 366 ] , "main_type": "NONE", "name": "Shape542", "outputIndexes": [ 367 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 366 ] , "main_type": "NONE", "name": "Rank544", "outputIndexes": [ 368 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 368, 368 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp546", "outputIndexes": [ 369 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 369 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze547", "outputIndexes": [ 370 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 369, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp549", "outputIndexes": [ 371 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 371 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze550", "outputIndexes": [ 372 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 367, 370, 372, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice553", "outputIndexes": [ 373 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 373 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze554", "outputIndexes": [ 374 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 374 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp555", "outputIndexes": [ 375 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 375, 374 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp556", "outputIndexes": [ 376 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 366, 376, 369 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.3/self_attn/Gather_3_output_0", "outputIndexes": [ 377 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 377, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Div_1_output_0", "outputIndexes": [ 378 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 378, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 379 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 364, 379, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_3_output_0", "outputIndexes": [ 380 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 380 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.3/self_attn/Neg_1_output_0", "outputIndexes": [ 381 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 378, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 382 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 364, 20, 382, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.3/self_attn/Slice_2_output_0", "outputIndexes": [ 383 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 381, 383 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.3/self_attn/Concat_4_output_0", "outputIndexes": [ 384 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 384, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Mul_3_output_0", "outputIndexes": [ 385 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 365, 385 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/self_attn/Add_1_output_0", "outputIndexes": [ 386 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2982 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 380076538, 2097174, 262144, 0, 0 ] } , "name": "/layers.3/self_attn/v_proj/Linear", "outputIndexes": [ 2991 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2991 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2992 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2992 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 387 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 388 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 334, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.3/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 389 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 388, 389, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.3/self_attn/Concat_2_output_0", "outputIndexes": [ 390 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 387, 390 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.3/self_attn/Reshape_2_output_0", "outputIndexes": [ 391 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 359, 386, 391, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.3/self_attn/FusedAttention", "outputIndexes": [ 392 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 392 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2993 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2993 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2994 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2994 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 382435856, 8388630, 1048576, 0, 0 ] } , "name": "/layers.3/self_attn/o_proj/Linear", "outputIndexes": [ 2995 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2995 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2996 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2996 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 393 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 313, 393 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/Add_output_0", "outputIndexes": [ 394 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 394 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 391873062, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.3/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 395 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 395 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2997 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2997 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2998 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2998 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 391905830, 29360150, 3670016, 0, 0 ] } , "name": "/layers.3/mlp/gate_proj/Linear", "outputIndexes": [ 2999 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2999 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3000 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3000 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 396 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 396 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.3/mlp/act_fn/Mul_output_0", "outputIndexes": [ 397 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2998 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 424935996, 29360150, 3670016, 0, 0 ] } , "name": "/layers.3/mlp/up_proj/Linear", "outputIndexes": [ 3003 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3003 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3004 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3004 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 398 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 397, 398 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/mlp/Mul_output_0", "outputIndexes": [ 399 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 399 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3005 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3005 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3006 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3006 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 457966162, 29360150, 3670016, 0, 0 ] } , "name": "/layers.3/mlp/down_proj/Linear", "outputIndexes": [ 3007 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3007 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3008 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3008 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 400 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 394, 400 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.3/Add_1_output_0", "outputIndexes": [ 401 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 401, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/Reshape_output_0", "outputIndexes": [ 402 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 402 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 490996328, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.4/input_layernorm/Mul_1_output_0", "outputIndexes": [ 403 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 403 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3009 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3009 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3010 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3010 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 491029096, 8388630, 1048576, 0, 0 ] } , "name": "/layers.4/self_attn/q_proj/Linear", "outputIndexes": [ 3011 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3011 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3012 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3012 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 404 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 403 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_output_0", "outputIndexes": [ 405 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 405 ] , "main_type": "NONE", "name": "Shape602", "outputIndexes": [ 406 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 405 ] , "main_type": "NONE", "name": "Rank604", "outputIndexes": [ 407 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 407, 407 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp606", "outputIndexes": [ 408 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 408 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze607", "outputIndexes": [ 409 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 408, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp609", "outputIndexes": [ 410 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze610", "outputIndexes": [ 411 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 406, 409, 411, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice613", "outputIndexes": [ 412 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 412 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze614", "outputIndexes": [ 413 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 413, 413 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp616", "outputIndexes": [ 414 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 405, 414, 408 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_output_0", "outputIndexes": [ 415 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 415, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_output_0", "outputIndexes": [ 416 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 408 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze624", "outputIndexes": [ 417 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze627", "outputIndexes": [ 418 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 406, 417, 418, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice630", "outputIndexes": [ 419 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 419 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze631", "outputIndexes": [ 420 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 420 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp632", "outputIndexes": [ 421 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 421, 420 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp633", "outputIndexes": [ 422 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 405, 422, 408 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_1_output_0", "outputIndexes": [ 423 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 424 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 416, 424, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_output_0", "outputIndexes": [ 425 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 404, 425 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_output_0", "outputIndexes": [ 426 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_output_0", "outputIndexes": [ 427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_2_output_0", "outputIndexes": [ 428 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 428 ] , "main_type": "NONE", "name": "Shape640", "outputIndexes": [ 429 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 428 ] , "main_type": "NONE", "name": "Rank642", "outputIndexes": [ 430 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 430, 430 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp644", "outputIndexes": [ 431 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 431 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze645", "outputIndexes": [ 432 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 431, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp647", "outputIndexes": [ 433 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 433 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze648", "outputIndexes": [ 434 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 429, 432, 434, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice651", "outputIndexes": [ 435 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 435 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze652", "outputIndexes": [ 436 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 436 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp653", "outputIndexes": [ 437 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 437, 436 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp654", "outputIndexes": [ 438 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 428, 438, 431 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_2_output_0", "outputIndexes": [ 439 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Div_output_0", "outputIndexes": [ 440 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 440, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 441 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426, 441, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_1_output_0", "outputIndexes": [ 442 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 442 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.4/self_attn/Neg_output_0", "outputIndexes": [ 443 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 440, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 444 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426, 20, 444, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_output_0", "outputIndexes": [ 445 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 443, 445 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.4/self_attn/Concat_3_output_0", "outputIndexes": [ 446 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 446, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_1_output_0", "outputIndexes": [ 447 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 427, 447 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Add_output_0", "outputIndexes": [ 448 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3010 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 500466302, 2097174, 262144, 0, 0 ] } , "name": "/layers.4/self_attn/k_proj/Linear", "outputIndexes": [ 3015 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3015 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3016 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3016 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 449 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 415, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 450 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 451 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 450, 451, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_1_output_0", "outputIndexes": [ 452 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 449, 452 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_1_output_0", "outputIndexes": [ 453 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_2_output_0", "outputIndexes": [ 454 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453 ] , "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_3_output_0", "outputIndexes": [ 455 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 455 ] , "main_type": "NONE", "name": "Shape673", "outputIndexes": [ 456 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 455 ] , "main_type": "NONE", "name": "Rank675", "outputIndexes": [ 457 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 457, 457 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp677", "outputIndexes": [ 458 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 458 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze678", "outputIndexes": [ 459 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 458, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp680", "outputIndexes": [ 460 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 460 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze681", "outputIndexes": [ 461 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 456, 459, 461, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice684", "outputIndexes": [ 462 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 462 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze685", "outputIndexes": [ 463 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 463 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp686", "outputIndexes": [ 464 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 464, 463 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp687", "outputIndexes": [ 465 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 455, 465, 458 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.4/self_attn/Gather_3_output_0", "outputIndexes": [ 466 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 466, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Div_1_output_0", "outputIndexes": [ 467 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 467, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 468 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453, 468, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_3_output_0", "outputIndexes": [ 469 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 469 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.4/self_attn/Neg_1_output_0", "outputIndexes": [ 470 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 467, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 471 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453, 20, 471, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.4/self_attn/Slice_2_output_0", "outputIndexes": [ 472 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 470, 472 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.4/self_attn/Concat_4_output_0", "outputIndexes": [ 473 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 473, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Mul_3_output_0", "outputIndexes": [ 474 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 454, 474 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/self_attn/Add_1_output_0", "outputIndexes": [ 475 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3010 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 502825620, 2097174, 262144, 0, 0 ] } , "name": "/layers.4/self_attn/v_proj/Linear", "outputIndexes": [ 3019 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3019 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3020 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3020 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 476 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 415, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 477 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.4/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 478 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 477, 478, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.4/self_attn/Concat_2_output_0", "outputIndexes": [ 479 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 476, 479 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.4/self_attn/Reshape_2_output_0", "outputIndexes": [ 480 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 448, 475, 480, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.4/self_attn/FusedAttention", "outputIndexes": [ 481 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 481 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3021 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3021 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3022 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3022 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 505184938, 8388630, 1048576, 0, 0 ] } , "name": "/layers.4/self_attn/o_proj/Linear", "outputIndexes": [ 3023 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3023 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3024 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3024 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 482 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 402, 482 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/Add_output_0", "outputIndexes": [ 483 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 483 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 514622144, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.4/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 484 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 484 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3025 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3025 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3026 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3026 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 514654912, 29360150, 3670016, 0, 0 ] } , "name": "/layers.4/mlp/gate_proj/Linear", "outputIndexes": [ 3027 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3027 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3028 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3028 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 485 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 485 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.4/mlp/act_fn/Mul_output_0", "outputIndexes": [ 486 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3026 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 547685078, 29360150, 3670016, 0, 0 ] } , "name": "/layers.4/mlp/up_proj/Linear", "outputIndexes": [ 3031 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3031 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3032 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3032 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 487 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 486, 487 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/mlp/Mul_output_0", "outputIndexes": [ 488 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 488 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3033 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3033 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3034 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3034 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 580715244, 29360150, 3670016, 0, 0 ] } , "name": "/layers.4/mlp/down_proj/Linear", "outputIndexes": [ 3035 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3035 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3036 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3036 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 489 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 483, 489 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.4/Add_1_output_0", "outputIndexes": [ 490 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 490, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/Reshape_output_0", "outputIndexes": [ 491 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 491 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 613745410, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.5/input_layernorm/Mul_1_output_0", "outputIndexes": [ 492 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 492 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3037 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3037 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3038 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3038 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 613778178, 8388630, 1048576, 0, 0 ] } , "name": "/layers.5/self_attn/q_proj/Linear", "outputIndexes": [ 3039 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3039 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3040 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3040 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 493 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 492 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_output_0", "outputIndexes": [ 494 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 494 ] , "main_type": "NONE", "name": "Shape733", "outputIndexes": [ 495 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 494 ] , "main_type": "NONE", "name": "Rank735", "outputIndexes": [ 496 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 496, 496 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp737", "outputIndexes": [ 497 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 497 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze738", "outputIndexes": [ 498 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 497, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp740", "outputIndexes": [ 499 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 499 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze741", "outputIndexes": [ 500 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 495, 498, 500, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice744", "outputIndexes": [ 501 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 501 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze745", "outputIndexes": [ 502 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 502, 502 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp747", "outputIndexes": [ 503 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 494, 503, 497 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_output_0", "outputIndexes": [ 504 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 504, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_output_0", "outputIndexes": [ 505 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 497 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze755", "outputIndexes": [ 506 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 499 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze758", "outputIndexes": [ 507 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 495, 506, 507, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice761", "outputIndexes": [ 508 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 508 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze762", "outputIndexes": [ 509 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 509 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp763", "outputIndexes": [ 510 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 510, 509 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp764", "outputIndexes": [ 511 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 494, 511, 497 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_1_output_0", "outputIndexes": [ 512 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 512, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 513 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 505, 513, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_output_0", "outputIndexes": [ 514 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 493, 514 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_output_0", "outputIndexes": [ 515 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 515, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_output_0", "outputIndexes": [ 516 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 515 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_2_output_0", "outputIndexes": [ 517 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 517 ] , "main_type": "NONE", "name": "Shape771", "outputIndexes": [ 518 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 517 ] , "main_type": "NONE", "name": "Rank773", "outputIndexes": [ 519 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 519, 519 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp775", "outputIndexes": [ 520 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 520 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze776", "outputIndexes": [ 521 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 520, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp778", "outputIndexes": [ 522 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 522 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze779", "outputIndexes": [ 523 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 518, 521, 523, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice782", "outputIndexes": [ 524 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 524 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze783", "outputIndexes": [ 525 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 525 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp784", "outputIndexes": [ 526 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 526, 525 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp785", "outputIndexes": [ 527 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517, 527, 520 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_2_output_0", "outputIndexes": [ 528 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 528, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Div_output_0", "outputIndexes": [ 529 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 529, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 530 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 515, 530, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_1_output_0", "outputIndexes": [ 531 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 531 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.5/self_attn/Neg_output_0", "outputIndexes": [ 532 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 529, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 533 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 515, 20, 533, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_output_0", "outputIndexes": [ 534 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 532, 534 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.5/self_attn/Concat_3_output_0", "outputIndexes": [ 535 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 535, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_1_output_0", "outputIndexes": [ 536 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 516, 536 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Add_output_0", "outputIndexes": [ 537 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3038 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 623215384, 2097174, 262144, 0, 0 ] } , "name": "/layers.5/self_attn/k_proj/Linear", "outputIndexes": [ 3043 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3043 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3044 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3044 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 538 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 504, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 539 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 512, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 540 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 539, 540, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_1_output_0", "outputIndexes": [ 541 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 538, 541 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_1_output_0", "outputIndexes": [ 542 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_2_output_0", "outputIndexes": [ 543 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542 ] , "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_3_output_0", "outputIndexes": [ 544 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 544 ] , "main_type": "NONE", "name": "Shape804", "outputIndexes": [ 545 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 544 ] , "main_type": "NONE", "name": "Rank806", "outputIndexes": [ 546 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 546, 546 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp808", "outputIndexes": [ 547 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 547 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze809", "outputIndexes": [ 548 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 547, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp811", "outputIndexes": [ 549 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 549 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze812", "outputIndexes": [ 550 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 545, 548, 550, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice815", "outputIndexes": [ 551 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 551 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze816", "outputIndexes": [ 552 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 552 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp817", "outputIndexes": [ 553 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 553, 552 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp818", "outputIndexes": [ 554 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 544, 554, 547 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.5/self_attn/Gather_3_output_0", "outputIndexes": [ 555 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 555, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Div_1_output_0", "outputIndexes": [ 556 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 556, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 557 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542, 557, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_3_output_0", "outputIndexes": [ 558 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 558 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.5/self_attn/Neg_1_output_0", "outputIndexes": [ 559 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 556, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 560 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542, 20, 560, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.5/self_attn/Slice_2_output_0", "outputIndexes": [ 561 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 559, 561 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.5/self_attn/Concat_4_output_0", "outputIndexes": [ 562 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 562, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Mul_3_output_0", "outputIndexes": [ 563 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 543, 563 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/self_attn/Add_1_output_0", "outputIndexes": [ 564 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3038 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 625574702, 2097174, 262144, 0, 0 ] } , "name": "/layers.5/self_attn/v_proj/Linear", "outputIndexes": [ 3047 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3047 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3048 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3048 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 565 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 504, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 566 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 512, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.5/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 567 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 566, 567, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.5/self_attn/Concat_2_output_0", "outputIndexes": [ 568 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 565, 568 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.5/self_attn/Reshape_2_output_0", "outputIndexes": [ 569 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 537, 564, 569, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.5/self_attn/FusedAttention", "outputIndexes": [ 570 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 570 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3049 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3049 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3050 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3050 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 627934020, 8388630, 1048576, 0, 0 ] } , "name": "/layers.5/self_attn/o_proj/Linear", "outputIndexes": [ 3051 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3051 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3052 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3052 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 571 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 491, 571 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/Add_output_0", "outputIndexes": [ 572 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 572 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 637371226, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.5/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 573 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 573 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3053 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3053 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3054 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3054 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 637403994, 29360150, 3670016, 0, 0 ] } , "name": "/layers.5/mlp/gate_proj/Linear", "outputIndexes": [ 3055 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3055 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3056 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3056 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 574 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 574 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.5/mlp/act_fn/Mul_output_0", "outputIndexes": [ 575 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3054 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 670434160, 29360150, 3670016, 0, 0 ] } , "name": "/layers.5/mlp/up_proj/Linear", "outputIndexes": [ 3059 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3059 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3060 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3060 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 576 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 575, 576 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/mlp/Mul_output_0", "outputIndexes": [ 577 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 577 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3061 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3061 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3062 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3062 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 703464326, 29360150, 3670016, 0, 0 ] } , "name": "/layers.5/mlp/down_proj/Linear", "outputIndexes": [ 3063 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3063 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3064 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3064 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 578 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 572, 578 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.5/Add_1_output_0", "outputIndexes": [ 579 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 579, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/Reshape_output_0", "outputIndexes": [ 580 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 580 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 736494492, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.6/input_layernorm/Mul_1_output_0", "outputIndexes": [ 581 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 581 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3065 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3065 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3066 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3066 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 736527260, 8388630, 1048576, 0, 0 ] } , "name": "/layers.6/self_attn/q_proj/Linear", "outputIndexes": [ 3067 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3067 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3068 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3068 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 582 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 581 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_output_0", "outputIndexes": [ 583 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 583 ] , "main_type": "NONE", "name": "Shape864", "outputIndexes": [ 584 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 583 ] , "main_type": "NONE", "name": "Rank866", "outputIndexes": [ 585 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 585, 585 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp868", "outputIndexes": [ 586 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 586 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze869", "outputIndexes": [ 587 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 586, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp871", "outputIndexes": [ 588 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 588 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze872", "outputIndexes": [ 589 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 584, 587, 589, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice875", "outputIndexes": [ 590 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 590 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze876", "outputIndexes": [ 591 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 591, 591 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp878", "outputIndexes": [ 592 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 583, 592, 586 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_output_0", "outputIndexes": [ 593 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_output_0", "outputIndexes": [ 594 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 586 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze886", "outputIndexes": [ 595 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 588 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze889", "outputIndexes": [ 596 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 584, 595, 596, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice892", "outputIndexes": [ 597 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 597 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze893", "outputIndexes": [ 598 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 598 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp894", "outputIndexes": [ 599 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 599, 598 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp895", "outputIndexes": [ 600 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 583, 600, 586 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_1_output_0", "outputIndexes": [ 601 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 602 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 594, 602, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_output_0", "outputIndexes": [ 603 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 582, 603 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_output_0", "outputIndexes": [ 604 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_output_0", "outputIndexes": [ 605 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_2_output_0", "outputIndexes": [ 606 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 606 ] , "main_type": "NONE", "name": "Shape902", "outputIndexes": [ 607 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 606 ] , "main_type": "NONE", "name": "Rank904", "outputIndexes": [ 608 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 608, 608 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp906", "outputIndexes": [ 609 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 609 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze907", "outputIndexes": [ 610 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 609, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp909", "outputIndexes": [ 611 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 611 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze910", "outputIndexes": [ 612 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 607, 610, 612, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice913", "outputIndexes": [ 613 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 613 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze914", "outputIndexes": [ 614 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 614 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp915", "outputIndexes": [ 615 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 615, 614 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp916", "outputIndexes": [ 616 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 606, 616, 609 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_2_output_0", "outputIndexes": [ 617 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 617, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Div_output_0", "outputIndexes": [ 618 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 618, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 619 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604, 619, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_1_output_0", "outputIndexes": [ 620 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 620 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.6/self_attn/Neg_output_0", "outputIndexes": [ 621 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 618, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 622 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604, 20, 622, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_output_0", "outputIndexes": [ 623 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 621, 623 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.6/self_attn/Concat_3_output_0", "outputIndexes": [ 624 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 624, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_1_output_0", "outputIndexes": [ 625 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 605, 625 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Add_output_0", "outputIndexes": [ 626 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3066 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 745964466, 2097174, 262144, 0, 0 ] } , "name": "/layers.6/self_attn/k_proj/Linear", "outputIndexes": [ 3071 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3071 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3072 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3072 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 627 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 628 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 629 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 628, 629, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_1_output_0", "outputIndexes": [ 630 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 627, 630 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_1_output_0", "outputIndexes": [ 631 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 631, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_2_output_0", "outputIndexes": [ 632 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 631 ] , "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_3_output_0", "outputIndexes": [ 633 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 633 ] , "main_type": "NONE", "name": "Shape935", "outputIndexes": [ 634 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 633 ] , "main_type": "NONE", "name": "Rank937", "outputIndexes": [ 635 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 635, 635 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp939", "outputIndexes": [ 636 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 636 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze940", "outputIndexes": [ 637 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 636, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp942", "outputIndexes": [ 638 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 638 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze943", "outputIndexes": [ 639 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 634, 637, 639, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice946", "outputIndexes": [ 640 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 640 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze947", "outputIndexes": [ 641 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 641 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp948", "outputIndexes": [ 642 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 642, 641 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp949", "outputIndexes": [ 643 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 633, 643, 636 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.6/self_attn/Gather_3_output_0", "outputIndexes": [ 644 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 644, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Div_1_output_0", "outputIndexes": [ 645 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 645, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 646 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 631, 646, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_3_output_0", "outputIndexes": [ 647 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 647 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.6/self_attn/Neg_1_output_0", "outputIndexes": [ 648 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 645, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 649 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 631, 20, 649, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.6/self_attn/Slice_2_output_0", "outputIndexes": [ 650 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 648, 650 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.6/self_attn/Concat_4_output_0", "outputIndexes": [ 651 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 651, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Mul_3_output_0", "outputIndexes": [ 652 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 632, 652 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/self_attn/Add_1_output_0", "outputIndexes": [ 653 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3066 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 748323784, 2097174, 262144, 0, 0 ] } , "name": "/layers.6/self_attn/v_proj/Linear", "outputIndexes": [ 3075 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3075 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3076 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3076 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 654 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 655 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.6/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 656 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 655, 656, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.6/self_attn/Concat_2_output_0", "outputIndexes": [ 657 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 654, 657 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.6/self_attn/Reshape_2_output_0", "outputIndexes": [ 658 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 626, 653, 658, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.6/self_attn/FusedAttention", "outputIndexes": [ 659 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 659 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3077 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3077 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3078 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3078 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 750683102, 8388630, 1048576, 0, 0 ] } , "name": "/layers.6/self_attn/o_proj/Linear", "outputIndexes": [ 3079 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3079 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3080 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3080 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 660 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 580, 660 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/Add_output_0", "outputIndexes": [ 661 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 661 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 760120308, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.6/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 662 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 662 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3081 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3081 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3082 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3082 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 760153076, 29360150, 3670016, 0, 0 ] } , "name": "/layers.6/mlp/gate_proj/Linear", "outputIndexes": [ 3083 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3083 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3084 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3084 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 663 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 663 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.6/mlp/act_fn/Mul_output_0", "outputIndexes": [ 664 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3082 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 793183242, 29360150, 3670016, 0, 0 ] } , "name": "/layers.6/mlp/up_proj/Linear", "outputIndexes": [ 3087 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3087 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3088 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3088 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 665 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 664, 665 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/mlp/Mul_output_0", "outputIndexes": [ 666 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 666 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3089 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3089 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3090 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3090 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 826213408, 29360150, 3670016, 0, 0 ] } , "name": "/layers.6/mlp/down_proj/Linear", "outputIndexes": [ 3091 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3091 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3092 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3092 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 667 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 661, 667 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.6/Add_1_output_0", "outputIndexes": [ 668 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 668, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/Reshape_output_0", "outputIndexes": [ 669 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 669 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 859243574, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.7/input_layernorm/Mul_1_output_0", "outputIndexes": [ 670 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 670 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3093 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3093 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3094 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3094 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 859276342, 8388630, 1048576, 0, 0 ] } , "name": "/layers.7/self_attn/q_proj/Linear", "outputIndexes": [ 3095 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3095 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3096 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3096 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 671 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 670 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_output_0", "outputIndexes": [ 672 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 672 ] , "main_type": "NONE", "name": "Shape995", "outputIndexes": [ 673 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 672 ] , "main_type": "NONE", "name": "Rank997", "outputIndexes": [ 674 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 674, 674 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp999", "outputIndexes": [ 675 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 675 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1000", "outputIndexes": [ 676 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 675, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1002", "outputIndexes": [ 677 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 677 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1003", "outputIndexes": [ 678 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 673, 676, 678, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1006", "outputIndexes": [ 679 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 679 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1007", "outputIndexes": [ 680 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 680, 680 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1009", "outputIndexes": [ 681 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 672, 681, 675 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_output_0", "outputIndexes": [ 682 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 682, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_output_0", "outputIndexes": [ 683 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 675 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1017", "outputIndexes": [ 684 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 677 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1020", "outputIndexes": [ 685 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 673, 684, 685, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1023", "outputIndexes": [ 686 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 686 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1024", "outputIndexes": [ 687 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 687 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1025", "outputIndexes": [ 688 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 688, 687 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1026", "outputIndexes": [ 689 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 672, 689, 675 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_1_output_0", "outputIndexes": [ 690 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 690, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 691 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 683, 691, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_output_0", "outputIndexes": [ 692 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 671, 692 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_output_0", "outputIndexes": [ 693 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 693, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_output_0", "outputIndexes": [ 694 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 693 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_2_output_0", "outputIndexes": [ 695 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 695 ] , "main_type": "NONE", "name": "Shape1033", "outputIndexes": [ 696 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 695 ] , "main_type": "NONE", "name": "Rank1035", "outputIndexes": [ 697 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 697, 697 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1037", "outputIndexes": [ 698 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 698 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1038", "outputIndexes": [ 699 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 698, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1040", "outputIndexes": [ 700 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 700 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1041", "outputIndexes": [ 701 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 696, 699, 701, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1044", "outputIndexes": [ 702 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 702 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1045", "outputIndexes": [ 703 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 703 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1046", "outputIndexes": [ 704 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 704, 703 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1047", "outputIndexes": [ 705 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 695, 705, 698 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_2_output_0", "outputIndexes": [ 706 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 706, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Div_output_0", "outputIndexes": [ 707 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 707, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 708 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 693, 708, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_1_output_0", "outputIndexes": [ 709 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 709 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.7/self_attn/Neg_output_0", "outputIndexes": [ 710 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 707, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 711 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 693, 20, 711, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_output_0", "outputIndexes": [ 712 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 710, 712 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.7/self_attn/Concat_3_output_0", "outputIndexes": [ 713 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 713, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_1_output_0", "outputIndexes": [ 714 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 694, 714 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Add_output_0", "outputIndexes": [ 715 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3094 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 868713548, 2097174, 262144, 0, 0 ] } , "name": "/layers.7/self_attn/k_proj/Linear", "outputIndexes": [ 3099 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3099 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3100 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3100 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 716 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 682, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 717 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 690, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 718 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 717, 718, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_1_output_0", "outputIndexes": [ 719 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 716, 719 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_1_output_0", "outputIndexes": [ 720 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 720, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_2_output_0", "outputIndexes": [ 721 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 720 ] , "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_3_output_0", "outputIndexes": [ 722 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 722 ] , "main_type": "NONE", "name": "Shape1066", "outputIndexes": [ 723 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 722 ] , "main_type": "NONE", "name": "Rank1068", "outputIndexes": [ 724 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 724, 724 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1070", "outputIndexes": [ 725 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 725 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1071", "outputIndexes": [ 726 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 725, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1073", "outputIndexes": [ 727 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 727 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1074", "outputIndexes": [ 728 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 723, 726, 728, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1077", "outputIndexes": [ 729 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 729 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1078", "outputIndexes": [ 730 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 730 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1079", "outputIndexes": [ 731 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 731, 730 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1080", "outputIndexes": [ 732 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 722, 732, 725 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.7/self_attn/Gather_3_output_0", "outputIndexes": [ 733 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 733, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Div_1_output_0", "outputIndexes": [ 734 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 734, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 735 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 720, 735, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_3_output_0", "outputIndexes": [ 736 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 736 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.7/self_attn/Neg_1_output_0", "outputIndexes": [ 737 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 734, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 738 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 720, 20, 738, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.7/self_attn/Slice_2_output_0", "outputIndexes": [ 739 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 737, 739 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.7/self_attn/Concat_4_output_0", "outputIndexes": [ 740 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 740, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Mul_3_output_0", "outputIndexes": [ 741 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 721, 741 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/self_attn/Add_1_output_0", "outputIndexes": [ 742 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3094 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 871072866, 2097174, 262144, 0, 0 ] } , "name": "/layers.7/self_attn/v_proj/Linear", "outputIndexes": [ 3103 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3103 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3104 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3104 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 743 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 682, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 744 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 690, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.7/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 745 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 744, 745, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.7/self_attn/Concat_2_output_0", "outputIndexes": [ 746 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 743, 746 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.7/self_attn/Reshape_2_output_0", "outputIndexes": [ 747 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 715, 742, 747, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.7/self_attn/FusedAttention", "outputIndexes": [ 748 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 748 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3105 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3105 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3106 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3106 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 873432184, 8388630, 1048576, 0, 0 ] } , "name": "/layers.7/self_attn/o_proj/Linear", "outputIndexes": [ 3107 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3107 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3108 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3108 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 749 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 669, 749 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/Add_output_0", "outputIndexes": [ 750 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 750 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 882869390, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.7/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 751 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 751 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3109 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3109 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3110 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3110 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 882902158, 29360150, 3670016, 0, 0 ] } , "name": "/layers.7/mlp/gate_proj/Linear", "outputIndexes": [ 3111 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3111 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3112 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3112 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 752 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 752 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.7/mlp/act_fn/Mul_output_0", "outputIndexes": [ 753 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3110 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 915932324, 29360150, 3670016, 0, 0 ] } , "name": "/layers.7/mlp/up_proj/Linear", "outputIndexes": [ 3115 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3115 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3116 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3116 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 754 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 753, 754 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/mlp/Mul_output_0", "outputIndexes": [ 755 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 755 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3117 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3117 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3118 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3118 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 948962490, 29360150, 3670016, 0, 0 ] } , "name": "/layers.7/mlp/down_proj/Linear", "outputIndexes": [ 3119 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3119 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3120 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3120 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 756 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 750, 756 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.7/Add_1_output_0", "outputIndexes": [ 757 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 757, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/Reshape_output_0", "outputIndexes": [ 758 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 758 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 981992656, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.8/input_layernorm/Mul_1_output_0", "outputIndexes": [ 759 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 759 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3121 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3121 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3122 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3122 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 982025424, 8388630, 1048576, 0, 0 ] } , "name": "/layers.8/self_attn/q_proj/Linear", "outputIndexes": [ 3123 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3123 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3124 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3124 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 760 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 759 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_output_0", "outputIndexes": [ 761 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 761 ] , "main_type": "NONE", "name": "Shape1126", "outputIndexes": [ 762 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 761 ] , "main_type": "NONE", "name": "Rank1128", "outputIndexes": [ 763 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 763, 763 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1130", "outputIndexes": [ 764 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1131", "outputIndexes": [ 765 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1133", "outputIndexes": [ 766 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 766 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1134", "outputIndexes": [ 767 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 762, 765, 767, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1137", "outputIndexes": [ 768 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 768 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1138", "outputIndexes": [ 769 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 769, 769 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1140", "outputIndexes": [ 770 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 761, 770, 764 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_output_0", "outputIndexes": [ 771 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 771, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_output_0", "outputIndexes": [ 772 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1148", "outputIndexes": [ 773 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 766 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1151", "outputIndexes": [ 774 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 762, 773, 774, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1154", "outputIndexes": [ 775 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 775 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1155", "outputIndexes": [ 776 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 776 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1156", "outputIndexes": [ 777 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 777, 776 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1157", "outputIndexes": [ 778 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 761, 778, 764 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_1_output_0", "outputIndexes": [ 779 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 779, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 780 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 772, 780, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_output_0", "outputIndexes": [ 781 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 760, 781 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_output_0", "outputIndexes": [ 782 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_output_0", "outputIndexes": [ 783 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_2_output_0", "outputIndexes": [ 784 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 784 ] , "main_type": "NONE", "name": "Shape1164", "outputIndexes": [ 785 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 784 ] , "main_type": "NONE", "name": "Rank1166", "outputIndexes": [ 786 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 786, 786 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1168", "outputIndexes": [ 787 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 787 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1169", "outputIndexes": [ 788 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 787, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1171", "outputIndexes": [ 789 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 789 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1172", "outputIndexes": [ 790 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 785, 788, 790, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1175", "outputIndexes": [ 791 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 791 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1176", "outputIndexes": [ 792 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 792 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1177", "outputIndexes": [ 793 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 793, 792 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1178", "outputIndexes": [ 794 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 784, 794, 787 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_2_output_0", "outputIndexes": [ 795 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 795, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Div_output_0", "outputIndexes": [ 796 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 796, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 797 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 797, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_1_output_0", "outputIndexes": [ 798 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 798 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.8/self_attn/Neg_output_0", "outputIndexes": [ 799 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 796, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 800 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 20, 800, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_output_0", "outputIndexes": [ 801 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 799, 801 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.8/self_attn/Concat_3_output_0", "outputIndexes": [ 802 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 802, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_1_output_0", "outputIndexes": [ 803 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 783, 803 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Add_output_0", "outputIndexes": [ 804 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3122 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 991462630, 2097174, 262144, 0, 0 ] } , "name": "/layers.8/self_attn/k_proj/Linear", "outputIndexes": [ 3127 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3127 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3128 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3128 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 805 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 771, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 806 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 779, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 807 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 806, 807, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_1_output_0", "outputIndexes": [ 808 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 805, 808 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_1_output_0", "outputIndexes": [ 809 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_2_output_0", "outputIndexes": [ 810 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809 ] , "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_3_output_0", "outputIndexes": [ 811 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 811 ] , "main_type": "NONE", "name": "Shape1197", "outputIndexes": [ 812 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 811 ] , "main_type": "NONE", "name": "Rank1199", "outputIndexes": [ 813 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 813, 813 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1201", "outputIndexes": [ 814 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 814 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1202", "outputIndexes": [ 815 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 814, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1204", "outputIndexes": [ 816 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1205", "outputIndexes": [ 817 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 812, 815, 817, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1208", "outputIndexes": [ 818 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 818 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1209", "outputIndexes": [ 819 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 819 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1210", "outputIndexes": [ 820 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 820, 819 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1211", "outputIndexes": [ 821 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 821, 814 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.8/self_attn/Gather_3_output_0", "outputIndexes": [ 822 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 822, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Div_1_output_0", "outputIndexes": [ 823 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 823, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 824 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809, 824, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_3_output_0", "outputIndexes": [ 825 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 825 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.8/self_attn/Neg_1_output_0", "outputIndexes": [ 826 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 823, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 827 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809, 20, 827, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.8/self_attn/Slice_2_output_0", "outputIndexes": [ 828 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 826, 828 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.8/self_attn/Concat_4_output_0", "outputIndexes": [ 829 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 829, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Mul_3_output_0", "outputIndexes": [ 830 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 810, 830 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/self_attn/Add_1_output_0", "outputIndexes": [ 831 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3122 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 993821948, 2097174, 262144, 0, 0 ] } , "name": "/layers.8/self_attn/v_proj/Linear", "outputIndexes": [ 3131 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3131 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3132 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3132 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 832 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 771, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 833 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 779, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.8/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 834 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 833, 834, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.8/self_attn/Concat_2_output_0", "outputIndexes": [ 835 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 832, 835 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.8/self_attn/Reshape_2_output_0", "outputIndexes": [ 836 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 804, 831, 836, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.8/self_attn/FusedAttention", "outputIndexes": [ 837 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 837 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3133 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3133 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3134 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3134 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 996181266, 8388630, 1048576, 0, 0 ] } , "name": "/layers.8/self_attn/o_proj/Linear", "outputIndexes": [ 3135 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3135 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3136 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3136 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 838 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 758, 838 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/Add_output_0", "outputIndexes": [ 839 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 839 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1005618472, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.8/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 840 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 840 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3137 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3137 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3138 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3138 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1005651240, 29360150, 3670016, 0, 0 ] } , "name": "/layers.8/mlp/gate_proj/Linear", "outputIndexes": [ 3139 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3139 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3140 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3140 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 841 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 841 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.8/mlp/act_fn/Mul_output_0", "outputIndexes": [ 842 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3138 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1038681406, 29360150, 3670016, 0, 0 ] } , "name": "/layers.8/mlp/up_proj/Linear", "outputIndexes": [ 3143 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3143 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3144 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3144 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 843 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 842, 843 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/mlp/Mul_output_0", "outputIndexes": [ 844 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 844 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3145 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3145 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3146 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3146 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1071711572, 29360150, 3670016, 0, 0 ] } , "name": "/layers.8/mlp/down_proj/Linear", "outputIndexes": [ 3147 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3147 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3148 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3148 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 845 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 839, 845 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.8/Add_1_output_0", "outputIndexes": [ 846 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 846, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/Reshape_output_0", "outputIndexes": [ 847 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 847 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1104741738, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.9/input_layernorm/Mul_1_output_0", "outputIndexes": [ 848 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 848 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3149 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3149 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3150 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3150 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1104774506, 8388630, 1048576, 0, 0 ] } , "name": "/layers.9/self_attn/q_proj/Linear", "outputIndexes": [ 3151 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3151 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3152 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3152 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 849 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 848 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_output_0", "outputIndexes": [ 850 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 850 ] , "main_type": "NONE", "name": "Shape1257", "outputIndexes": [ 851 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 850 ] , "main_type": "NONE", "name": "Rank1259", "outputIndexes": [ 852 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 852, 852 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1261", "outputIndexes": [ 853 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 853 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1262", "outputIndexes": [ 854 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 853, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1264", "outputIndexes": [ 855 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 855 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1265", "outputIndexes": [ 856 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 851, 854, 856, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1268", "outputIndexes": [ 857 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 857 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1269", "outputIndexes": [ 858 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 858, 858 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1271", "outputIndexes": [ 859 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850, 859, 853 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_output_0", "outputIndexes": [ 860 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 860, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_output_0", "outputIndexes": [ 861 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 853 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1279", "outputIndexes": [ 862 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 855 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1282", "outputIndexes": [ 863 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 851, 862, 863, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1285", "outputIndexes": [ 864 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 864 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1286", "outputIndexes": [ 865 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 865 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1287", "outputIndexes": [ 866 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 866, 865 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1288", "outputIndexes": [ 867 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850, 867, 853 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_1_output_0", "outputIndexes": [ 868 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 868, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 869 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 861, 869, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_output_0", "outputIndexes": [ 870 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 849, 870 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_output_0", "outputIndexes": [ 871 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 871, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_output_0", "outputIndexes": [ 872 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 871 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_2_output_0", "outputIndexes": [ 873 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 873 ] , "main_type": "NONE", "name": "Shape1295", "outputIndexes": [ 874 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 873 ] , "main_type": "NONE", "name": "Rank1297", "outputIndexes": [ 875 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 875, 875 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1299", "outputIndexes": [ 876 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 876 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1300", "outputIndexes": [ 877 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 876, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1302", "outputIndexes": [ 878 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 878 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1303", "outputIndexes": [ 879 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 874, 877, 879, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1306", "outputIndexes": [ 880 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 880 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1307", "outputIndexes": [ 881 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 881 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1308", "outputIndexes": [ 882 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 882, 881 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1309", "outputIndexes": [ 883 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 873, 883, 876 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_2_output_0", "outputIndexes": [ 884 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 884, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Div_output_0", "outputIndexes": [ 885 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 885, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 886 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 871, 886, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_1_output_0", "outputIndexes": [ 887 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 887 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.9/self_attn/Neg_output_0", "outputIndexes": [ 888 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 885, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 889 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 871, 20, 889, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_output_0", "outputIndexes": [ 890 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 888, 890 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.9/self_attn/Concat_3_output_0", "outputIndexes": [ 891 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 891, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_1_output_0", "outputIndexes": [ 892 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 872, 892 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Add_output_0", "outputIndexes": [ 893 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3150 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1114211712, 2097174, 262144, 0, 0 ] } , "name": "/layers.9/self_attn/k_proj/Linear", "outputIndexes": [ 3155 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3155 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3156 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3156 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 894 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 860, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 895 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 868, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 896 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 895, 896, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_1_output_0", "outputIndexes": [ 897 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 894, 897 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_1_output_0", "outputIndexes": [ 898 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_2_output_0", "outputIndexes": [ 899 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898 ] , "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_3_output_0", "outputIndexes": [ 900 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 900 ] , "main_type": "NONE", "name": "Shape1328", "outputIndexes": [ 901 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 900 ] , "main_type": "NONE", "name": "Rank1330", "outputIndexes": [ 902 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 902, 902 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1332", "outputIndexes": [ 903 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 903 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1333", "outputIndexes": [ 904 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 903, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1335", "outputIndexes": [ 905 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 905 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1336", "outputIndexes": [ 906 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 901, 904, 906, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1339", "outputIndexes": [ 907 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 907 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1340", "outputIndexes": [ 908 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 908 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1341", "outputIndexes": [ 909 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 909, 908 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1342", "outputIndexes": [ 910 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 900, 910, 903 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.9/self_attn/Gather_3_output_0", "outputIndexes": [ 911 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 911, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Div_1_output_0", "outputIndexes": [ 912 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 912, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 913 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898, 913, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_3_output_0", "outputIndexes": [ 914 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 914 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.9/self_attn/Neg_1_output_0", "outputIndexes": [ 915 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 912, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 916 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898, 20, 916, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.9/self_attn/Slice_2_output_0", "outputIndexes": [ 917 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 915, 917 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.9/self_attn/Concat_4_output_0", "outputIndexes": [ 918 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 918, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Mul_3_output_0", "outputIndexes": [ 919 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 899, 919 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/self_attn/Add_1_output_0", "outputIndexes": [ 920 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3150 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1116571030, 2097174, 262144, 0, 0 ] } , "name": "/layers.9/self_attn/v_proj/Linear", "outputIndexes": [ 3159 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3159 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3160 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3160 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 921 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 860, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 922 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 868, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.9/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 923 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 922, 923, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.9/self_attn/Concat_2_output_0", "outputIndexes": [ 924 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 921, 924 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.9/self_attn/Reshape_2_output_0", "outputIndexes": [ 925 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 893, 920, 925, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.9/self_attn/FusedAttention", "outputIndexes": [ 926 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 926 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3161 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3161 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3162 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3162 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1118930348, 8388630, 1048576, 0, 0 ] } , "name": "/layers.9/self_attn/o_proj/Linear", "outputIndexes": [ 3163 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3163 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3164 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3164 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 927 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 847, 927 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/Add_output_0", "outputIndexes": [ 928 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 928 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1128367554, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.9/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 929 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 929 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3165 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3165 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3166 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3166 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1128400322, 29360150, 3670016, 0, 0 ] } , "name": "/layers.9/mlp/gate_proj/Linear", "outputIndexes": [ 3167 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3167 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3168 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3168 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 930 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 930 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.9/mlp/act_fn/Mul_output_0", "outputIndexes": [ 931 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3166 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1161430488, 29360150, 3670016, 0, 0 ] } , "name": "/layers.9/mlp/up_proj/Linear", "outputIndexes": [ 3171 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3171 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3172 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3172 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 932 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 931, 932 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/mlp/Mul_output_0", "outputIndexes": [ 933 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 933 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3173 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3173 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3174 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3174 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1194460654, 29360150, 3670016, 0, 0 ] } , "name": "/layers.9/mlp/down_proj/Linear", "outputIndexes": [ 3175 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3175 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3176 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3176 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 934 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 928, 934 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.9/Add_1_output_0", "outputIndexes": [ 935 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 935, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/Reshape_output_0", "outputIndexes": [ 936 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 936 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1227490820, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.10/input_layernorm/Mul_1_output_0", "outputIndexes": [ 937 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 937 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3177 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3177 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3178 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3178 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1227523588, 8388630, 1048576, 0, 0 ] } , "name": "/layers.10/self_attn/q_proj/Linear", "outputIndexes": [ 3179 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3179 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3180 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3180 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 938 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 937 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_output_0", "outputIndexes": [ 939 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 939 ] , "main_type": "NONE", "name": "Shape1388", "outputIndexes": [ 940 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 939 ] , "main_type": "NONE", "name": "Rank1390", "outputIndexes": [ 941 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 941, 941 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1392", "outputIndexes": [ 942 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1393", "outputIndexes": [ 943 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1395", "outputIndexes": [ 944 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 944 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1396", "outputIndexes": [ 945 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 940, 943, 945, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1399", "outputIndexes": [ 946 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 946 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1400", "outputIndexes": [ 947 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 947, 947 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1402", "outputIndexes": [ 948 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 939, 948, 942 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_output_0", "outputIndexes": [ 949 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 949, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_output_0", "outputIndexes": [ 950 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1410", "outputIndexes": [ 951 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 944 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1413", "outputIndexes": [ 952 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 940, 951, 952, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1416", "outputIndexes": [ 953 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 953 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1417", "outputIndexes": [ 954 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 954 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1418", "outputIndexes": [ 955 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 955, 954 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1419", "outputIndexes": [ 956 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 939, 956, 942 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_1_output_0", "outputIndexes": [ 957 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 957, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 958 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 950, 958, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_output_0", "outputIndexes": [ 959 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 938, 959 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_output_0", "outputIndexes": [ 960 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 960, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_output_0", "outputIndexes": [ 961 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 960 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_2_output_0", "outputIndexes": [ 962 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 962 ] , "main_type": "NONE", "name": "Shape1426", "outputIndexes": [ 963 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 962 ] , "main_type": "NONE", "name": "Rank1428", "outputIndexes": [ 964 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 964, 964 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1430", "outputIndexes": [ 965 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 965 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1431", "outputIndexes": [ 966 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 965, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1433", "outputIndexes": [ 967 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 967 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1434", "outputIndexes": [ 968 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 963, 966, 968, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1437", "outputIndexes": [ 969 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 969 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1438", "outputIndexes": [ 970 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 970 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1439", "outputIndexes": [ 971 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 971, 970 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1440", "outputIndexes": [ 972 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 962, 972, 965 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_2_output_0", "outputIndexes": [ 973 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 973, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Div_output_0", "outputIndexes": [ 974 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 974, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 975 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 960, 975, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_1_output_0", "outputIndexes": [ 976 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 976 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.10/self_attn/Neg_output_0", "outputIndexes": [ 977 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 974, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 978 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 960, 20, 978, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_output_0", "outputIndexes": [ 979 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 977, 979 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.10/self_attn/Concat_3_output_0", "outputIndexes": [ 980 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 980, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_1_output_0", "outputIndexes": [ 981 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 961, 981 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Add_output_0", "outputIndexes": [ 982 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3178 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1236960794, 2097174, 262144, 0, 0 ] } , "name": "/layers.10/self_attn/k_proj/Linear", "outputIndexes": [ 3183 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3183 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3184 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3184 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 983 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 949, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 984 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 957, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 985 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 984, 985, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_1_output_0", "outputIndexes": [ 986 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 983, 986 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_1_output_0", "outputIndexes": [ 987 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 987, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_2_output_0", "outputIndexes": [ 988 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 987 ] , "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_3_output_0", "outputIndexes": [ 989 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 989 ] , "main_type": "NONE", "name": "Shape1459", "outputIndexes": [ 990 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 989 ] , "main_type": "NONE", "name": "Rank1461", "outputIndexes": [ 991 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 991, 991 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1463", "outputIndexes": [ 992 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 992 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1464", "outputIndexes": [ 993 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 992, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1466", "outputIndexes": [ 994 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 994 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1467", "outputIndexes": [ 995 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 990, 993, 995, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1470", "outputIndexes": [ 996 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 996 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1471", "outputIndexes": [ 997 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 997 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1472", "outputIndexes": [ 998 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 998, 997 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1473", "outputIndexes": [ 999 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 989, 999, 992 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.10/self_attn/Gather_3_output_0", "outputIndexes": [ 1000 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1000, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Div_1_output_0", "outputIndexes": [ 1001 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1001, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1002 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 987, 1002, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_3_output_0", "outputIndexes": [ 1003 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1003 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.10/self_attn/Neg_1_output_0", "outputIndexes": [ 1004 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1001, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1005 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 987, 20, 1005, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.10/self_attn/Slice_2_output_0", "outputIndexes": [ 1006 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1004, 1006 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.10/self_attn/Concat_4_output_0", "outputIndexes": [ 1007 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1007, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Mul_3_output_0", "outputIndexes": [ 1008 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 988, 1008 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/self_attn/Add_1_output_0", "outputIndexes": [ 1009 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3178 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1239320112, 2097174, 262144, 0, 0 ] } , "name": "/layers.10/self_attn/v_proj/Linear", "outputIndexes": [ 3187 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3187 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3188 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3188 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1010 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 949, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1011 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 957, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.10/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1012 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1011, 1012, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.10/self_attn/Concat_2_output_0", "outputIndexes": [ 1013 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1010, 1013 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.10/self_attn/Reshape_2_output_0", "outputIndexes": [ 1014 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 982, 1009, 1014, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.10/self_attn/FusedAttention", "outputIndexes": [ 1015 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1015 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3189 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3189 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3190 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3190 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1241679430, 8388630, 1048576, 0, 0 ] } , "name": "/layers.10/self_attn/o_proj/Linear", "outputIndexes": [ 3191 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3191 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3192 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3192 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1016 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 936, 1016 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/Add_output_0", "outputIndexes": [ 1017 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1017 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1251116636, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.10/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1018 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1018 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3193 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3193 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3194 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3194 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1251149404, 29360150, 3670016, 0, 0 ] } , "name": "/layers.10/mlp/gate_proj/Linear", "outputIndexes": [ 3195 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3195 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3196 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3196 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1019 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1019 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.10/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1020 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3194 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1284179570, 29360150, 3670016, 0, 0 ] } , "name": "/layers.10/mlp/up_proj/Linear", "outputIndexes": [ 3199 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3199 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3200 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3200 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1021 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1020, 1021 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/mlp/Mul_output_0", "outputIndexes": [ 1022 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1022 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3201 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3201 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3202 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3202 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1317209736, 29360150, 3670016, 0, 0 ] } , "name": "/layers.10/mlp/down_proj/Linear", "outputIndexes": [ 3203 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3203 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3204 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3204 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1023 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1017, 1023 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.10/Add_1_output_0", "outputIndexes": [ 1024 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1024, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/Reshape_output_0", "outputIndexes": [ 1025 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1025 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1350239902, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.11/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1026 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1026 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3205 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3205 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3206 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3206 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1350272670, 8388630, 1048576, 0, 0 ] } , "name": "/layers.11/self_attn/q_proj/Linear", "outputIndexes": [ 3207 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3207 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3208 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3208 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1027 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1026 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_output_0", "outputIndexes": [ 1028 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1028 ] , "main_type": "NONE", "name": "Shape1519", "outputIndexes": [ 1029 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1028 ] , "main_type": "NONE", "name": "Rank1521", "outputIndexes": [ 1030 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1030, 1030 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1523", "outputIndexes": [ 1031 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1524", "outputIndexes": [ 1032 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1526", "outputIndexes": [ 1033 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1033 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1527", "outputIndexes": [ 1034 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1029, 1032, 1034, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1530", "outputIndexes": [ 1035 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1035 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1531", "outputIndexes": [ 1036 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1036, 1036 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1533", "outputIndexes": [ 1037 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1028, 1037, 1031 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_output_0", "outputIndexes": [ 1038 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1038, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1039 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1541", "outputIndexes": [ 1040 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1033 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1544", "outputIndexes": [ 1041 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1029, 1040, 1041, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1547", "outputIndexes": [ 1042 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1042 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1548", "outputIndexes": [ 1043 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1043 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1549", "outputIndexes": [ 1044 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1044, 1043 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1550", "outputIndexes": [ 1045 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1028, 1045, 1031 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_1_output_0", "outputIndexes": [ 1046 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1046, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1047 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1039, 1047, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_output_0", "outputIndexes": [ 1048 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1027, 1048 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_output_0", "outputIndexes": [ 1049 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1049, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_output_0", "outputIndexes": [ 1050 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1049 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_2_output_0", "outputIndexes": [ 1051 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1051 ] , "main_type": "NONE", "name": "Shape1557", "outputIndexes": [ 1052 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1051 ] , "main_type": "NONE", "name": "Rank1559", "outputIndexes": [ 1053 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1053, 1053 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1561", "outputIndexes": [ 1054 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1054 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1562", "outputIndexes": [ 1055 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1054, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1564", "outputIndexes": [ 1056 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1056 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1565", "outputIndexes": [ 1057 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1052, 1055, 1057, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1568", "outputIndexes": [ 1058 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1058 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1569", "outputIndexes": [ 1059 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1059 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1570", "outputIndexes": [ 1060 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1060, 1059 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1571", "outputIndexes": [ 1061 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1051, 1061, 1054 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_2_output_0", "outputIndexes": [ 1062 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1062, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Div_output_0", "outputIndexes": [ 1063 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1063, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1064 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1049, 1064, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_1_output_0", "outputIndexes": [ 1065 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1065 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.11/self_attn/Neg_output_0", "outputIndexes": [ 1066 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1063, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1067 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1049, 20, 1067, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_output_0", "outputIndexes": [ 1068 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1066, 1068 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.11/self_attn/Concat_3_output_0", "outputIndexes": [ 1069 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1069, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_1_output_0", "outputIndexes": [ 1070 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1050, 1070 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Add_output_0", "outputIndexes": [ 1071 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3206 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1359709876, 2097174, 262144, 0, 0 ] } , "name": "/layers.11/self_attn/k_proj/Linear", "outputIndexes": [ 3211 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3211 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3212 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3212 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1072 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1038, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1073 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1046, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1074 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1073, 1074, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_1_output_0", "outputIndexes": [ 1075 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1072, 1075 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_1_output_0", "outputIndexes": [ 1076 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1076, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_2_output_0", "outputIndexes": [ 1077 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1076 ] , "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_3_output_0", "outputIndexes": [ 1078 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1078 ] , "main_type": "NONE", "name": "Shape1590", "outputIndexes": [ 1079 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1078 ] , "main_type": "NONE", "name": "Rank1592", "outputIndexes": [ 1080 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1080, 1080 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1594", "outputIndexes": [ 1081 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1081 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1595", "outputIndexes": [ 1082 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1081, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1597", "outputIndexes": [ 1083 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1083 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1598", "outputIndexes": [ 1084 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1079, 1082, 1084, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1601", "outputIndexes": [ 1085 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1085 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1602", "outputIndexes": [ 1086 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1086 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1603", "outputIndexes": [ 1087 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1087, 1086 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1604", "outputIndexes": [ 1088 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1078, 1088, 1081 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.11/self_attn/Gather_3_output_0", "outputIndexes": [ 1089 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1089, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Div_1_output_0", "outputIndexes": [ 1090 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1091 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1076, 1091, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_3_output_0", "outputIndexes": [ 1092 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1092 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.11/self_attn/Neg_1_output_0", "outputIndexes": [ 1093 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1094 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1076, 20, 1094, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.11/self_attn/Slice_2_output_0", "outputIndexes": [ 1095 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1093, 1095 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.11/self_attn/Concat_4_output_0", "outputIndexes": [ 1096 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1096, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Mul_3_output_0", "outputIndexes": [ 1097 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1077, 1097 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/self_attn/Add_1_output_0", "outputIndexes": [ 1098 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3206 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1362069194, 2097174, 262144, 0, 0 ] } , "name": "/layers.11/self_attn/v_proj/Linear", "outputIndexes": [ 3215 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3215 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3216 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3216 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1099 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1038, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1100 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1046, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.11/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1101 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1100, 1101, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.11/self_attn/Concat_2_output_0", "outputIndexes": [ 1102 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1099, 1102 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.11/self_attn/Reshape_2_output_0", "outputIndexes": [ 1103 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1071, 1098, 1103, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.11/self_attn/FusedAttention", "outputIndexes": [ 1104 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1104 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3217 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3217 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3218 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3218 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1364428512, 8388630, 1048576, 0, 0 ] } , "name": "/layers.11/self_attn/o_proj/Linear", "outputIndexes": [ 3219 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3219 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3220 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3220 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1105 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1025, 1105 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/Add_output_0", "outputIndexes": [ 1106 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1106 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1373865718, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.11/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1107 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1107 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3221 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3221 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3222 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3222 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1373898486, 29360150, 3670016, 0, 0 ] } , "name": "/layers.11/mlp/gate_proj/Linear", "outputIndexes": [ 3223 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3223 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3224 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3224 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1108 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1108 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.11/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1109 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3222 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1406928652, 29360150, 3670016, 0, 0 ] } , "name": "/layers.11/mlp/up_proj/Linear", "outputIndexes": [ 3227 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3227 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3228 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3228 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1110 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1109, 1110 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/mlp/Mul_output_0", "outputIndexes": [ 1111 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1111 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3229 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3229 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3230 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3230 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1439958818, 29360150, 3670016, 0, 0 ] } , "name": "/layers.11/mlp/down_proj/Linear", "outputIndexes": [ 3231 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3231 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3232 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3232 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1112 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1106, 1112 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.11/Add_1_output_0", "outputIndexes": [ 1113 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1113, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/Reshape_output_0", "outputIndexes": [ 1114 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1114 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1472988984, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.12/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1115 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1115 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3233 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3233 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3234 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3234 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1473021752, 8388630, 1048576, 0, 0 ] } , "name": "/layers.12/self_attn/q_proj/Linear", "outputIndexes": [ 3235 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3235 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3236 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3236 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1116 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1115 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_output_0", "outputIndexes": [ 1117 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1117 ] , "main_type": "NONE", "name": "Shape1650", "outputIndexes": [ 1118 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1117 ] , "main_type": "NONE", "name": "Rank1652", "outputIndexes": [ 1119 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1119, 1119 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1654", "outputIndexes": [ 1120 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1120 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1655", "outputIndexes": [ 1121 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1120, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1657", "outputIndexes": [ 1122 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1122 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1658", "outputIndexes": [ 1123 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1118, 1121, 1123, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1661", "outputIndexes": [ 1124 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1124 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1662", "outputIndexes": [ 1125 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1125, 1125 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1664", "outputIndexes": [ 1126 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1117, 1126, 1120 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_output_0", "outputIndexes": [ 1127 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1127, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1128 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1120 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1672", "outputIndexes": [ 1129 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1122 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1675", "outputIndexes": [ 1130 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1118, 1129, 1130, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1678", "outputIndexes": [ 1131 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1131 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1679", "outputIndexes": [ 1132 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1132 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1680", "outputIndexes": [ 1133 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1133, 1132 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1681", "outputIndexes": [ 1134 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1117, 1134, 1120 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_1_output_0", "outputIndexes": [ 1135 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1135, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1136 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1128, 1136, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_output_0", "outputIndexes": [ 1137 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1116, 1137 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_output_0", "outputIndexes": [ 1138 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_output_0", "outputIndexes": [ 1139 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_2_output_0", "outputIndexes": [ 1140 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1140 ] , "main_type": "NONE", "name": "Shape1688", "outputIndexes": [ 1141 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1140 ] , "main_type": "NONE", "name": "Rank1690", "outputIndexes": [ 1142 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1142, 1142 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1692", "outputIndexes": [ 1143 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1143 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1693", "outputIndexes": [ 1144 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1143, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1695", "outputIndexes": [ 1145 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1145 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1696", "outputIndexes": [ 1146 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1141, 1144, 1146, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1699", "outputIndexes": [ 1147 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1147 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1700", "outputIndexes": [ 1148 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1148 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1701", "outputIndexes": [ 1149 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1149, 1148 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1702", "outputIndexes": [ 1150 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1140, 1150, 1143 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_2_output_0", "outputIndexes": [ 1151 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1151, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Div_output_0", "outputIndexes": [ 1152 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1152, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1153 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138, 1153, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_1_output_0", "outputIndexes": [ 1154 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.12/self_attn/Neg_output_0", "outputIndexes": [ 1155 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1152, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1156 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138, 20, 1156, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_output_0", "outputIndexes": [ 1157 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1155, 1157 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.12/self_attn/Concat_3_output_0", "outputIndexes": [ 1158 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1158, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_1_output_0", "outputIndexes": [ 1159 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1139, 1159 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Add_output_0", "outputIndexes": [ 1160 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3234 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1482458958, 2097174, 262144, 0, 0 ] } , "name": "/layers.12/self_attn/k_proj/Linear", "outputIndexes": [ 3239 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3239 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3240 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3240 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1161 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1127, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1162 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1135, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1163 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1162, 1163, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_1_output_0", "outputIndexes": [ 1164 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1161, 1164 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_1_output_0", "outputIndexes": [ 1165 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_2_output_0", "outputIndexes": [ 1166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165 ] , "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_3_output_0", "outputIndexes": [ 1167 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1167 ] , "main_type": "NONE", "name": "Shape1721", "outputIndexes": [ 1168 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1167 ] , "main_type": "NONE", "name": "Rank1723", "outputIndexes": [ 1169 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1169, 1169 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1725", "outputIndexes": [ 1170 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1170 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1726", "outputIndexes": [ 1171 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1170, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1728", "outputIndexes": [ 1172 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1172 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1729", "outputIndexes": [ 1173 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1168, 1171, 1173, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1732", "outputIndexes": [ 1174 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1174 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1733", "outputIndexes": [ 1175 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1175 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1734", "outputIndexes": [ 1176 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1176, 1175 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1735", "outputIndexes": [ 1177 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1167, 1177, 1170 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.12/self_attn/Gather_3_output_0", "outputIndexes": [ 1178 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1178, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Div_1_output_0", "outputIndexes": [ 1179 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1179, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1180 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 1180, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_3_output_0", "outputIndexes": [ 1181 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1181 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.12/self_attn/Neg_1_output_0", "outputIndexes": [ 1182 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1179, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1183 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 20, 1183, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.12/self_attn/Slice_2_output_0", "outputIndexes": [ 1184 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1182, 1184 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.12/self_attn/Concat_4_output_0", "outputIndexes": [ 1185 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1185, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Mul_3_output_0", "outputIndexes": [ 1186 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1166, 1186 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/self_attn/Add_1_output_0", "outputIndexes": [ 1187 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3234 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1484818276, 2097174, 262144, 0, 0 ] } , "name": "/layers.12/self_attn/v_proj/Linear", "outputIndexes": [ 3243 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3243 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3244 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3244 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1188 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1127, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1189 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1135, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.12/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1190 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1189, 1190, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.12/self_attn/Concat_2_output_0", "outputIndexes": [ 1191 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1188, 1191 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.12/self_attn/Reshape_2_output_0", "outputIndexes": [ 1192 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1160, 1187, 1192, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.12/self_attn/FusedAttention", "outputIndexes": [ 1193 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1193 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3245 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3245 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3246 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3246 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1487177594, 8388630, 1048576, 0, 0 ] } , "name": "/layers.12/self_attn/o_proj/Linear", "outputIndexes": [ 3247 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3247 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3248 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3248 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1194 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1114, 1194 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/Add_output_0", "outputIndexes": [ 1195 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1195 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1496614800, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.12/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1196 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1196 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3249 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3249 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3250 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3250 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1496647568, 29360150, 3670016, 0, 0 ] } , "name": "/layers.12/mlp/gate_proj/Linear", "outputIndexes": [ 3251 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3251 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3252 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3252 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1197 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1197 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.12/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1198 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3250 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1529677734, 29360150, 3670016, 0, 0 ] } , "name": "/layers.12/mlp/up_proj/Linear", "outputIndexes": [ 3255 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3255 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3256 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3256 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1199 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1198, 1199 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/mlp/Mul_output_0", "outputIndexes": [ 1200 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1200 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3257 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3257 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3258 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3258 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1562707900, 29360150, 3670016, 0, 0 ] } , "name": "/layers.12/mlp/down_proj/Linear", "outputIndexes": [ 3259 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3259 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3260 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3260 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1201 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1195, 1201 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.12/Add_1_output_0", "outputIndexes": [ 1202 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1202, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/Reshape_output_0", "outputIndexes": [ 1203 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1203 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1595738066, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.13/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1204 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1204 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3261 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3261 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3262 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3262 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1595770834, 8388630, 1048576, 0, 0 ] } , "name": "/layers.13/self_attn/q_proj/Linear", "outputIndexes": [ 3263 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3263 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3264 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3264 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1205 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1204 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_output_0", "outputIndexes": [ 1206 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1206 ] , "main_type": "NONE", "name": "Shape1781", "outputIndexes": [ 1207 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1206 ] , "main_type": "NONE", "name": "Rank1783", "outputIndexes": [ 1208 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1208, 1208 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1785", "outputIndexes": [ 1209 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1786", "outputIndexes": [ 1210 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1788", "outputIndexes": [ 1211 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1789", "outputIndexes": [ 1212 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1207, 1210, 1212, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1792", "outputIndexes": [ 1213 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1213 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1793", "outputIndexes": [ 1214 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1214, 1214 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1795", "outputIndexes": [ 1215 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1206, 1215, 1209 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_output_0", "outputIndexes": [ 1216 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1217 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1803", "outputIndexes": [ 1218 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1806", "outputIndexes": [ 1219 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1207, 1218, 1219, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1809", "outputIndexes": [ 1220 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1220 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1810", "outputIndexes": [ 1221 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1221 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1811", "outputIndexes": [ 1222 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1222, 1221 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1812", "outputIndexes": [ 1223 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1206, 1223, 1209 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_1_output_0", "outputIndexes": [ 1224 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1225 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1217, 1225, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_output_0", "outputIndexes": [ 1226 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1205, 1226 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_output_0", "outputIndexes": [ 1227 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_output_0", "outputIndexes": [ 1228 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_2_output_0", "outputIndexes": [ 1229 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1229 ] , "main_type": "NONE", "name": "Shape1819", "outputIndexes": [ 1230 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1229 ] , "main_type": "NONE", "name": "Rank1821", "outputIndexes": [ 1231 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1231, 1231 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1823", "outputIndexes": [ 1232 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1232 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1824", "outputIndexes": [ 1233 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1232, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1826", "outputIndexes": [ 1234 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1234 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1827", "outputIndexes": [ 1235 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1230, 1233, 1235, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1830", "outputIndexes": [ 1236 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1236 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1831", "outputIndexes": [ 1237 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1237 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1832", "outputIndexes": [ 1238 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1238, 1237 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1833", "outputIndexes": [ 1239 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229, 1239, 1232 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_2_output_0", "outputIndexes": [ 1240 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1240, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Div_output_0", "outputIndexes": [ 1241 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1241, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1242 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227, 1242, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_1_output_0", "outputIndexes": [ 1243 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1243 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.13/self_attn/Neg_output_0", "outputIndexes": [ 1244 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1241, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1245 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227, 20, 1245, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_output_0", "outputIndexes": [ 1246 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1244, 1246 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.13/self_attn/Concat_3_output_0", "outputIndexes": [ 1247 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1247, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_1_output_0", "outputIndexes": [ 1248 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1228, 1248 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Add_output_0", "outputIndexes": [ 1249 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3262 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1605208040, 2097174, 262144, 0, 0 ] } , "name": "/layers.13/self_attn/k_proj/Linear", "outputIndexes": [ 3267 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3267 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3268 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3268 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1250 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1251 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1252 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1251, 1252, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_1_output_0", "outputIndexes": [ 1253 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1250, 1253 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_1_output_0", "outputIndexes": [ 1254 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1254, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_2_output_0", "outputIndexes": [ 1255 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1254 ] , "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_3_output_0", "outputIndexes": [ 1256 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1256 ] , "main_type": "NONE", "name": "Shape1852", "outputIndexes": [ 1257 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1256 ] , "main_type": "NONE", "name": "Rank1854", "outputIndexes": [ 1258 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1258, 1258 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1856", "outputIndexes": [ 1259 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1259 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1857", "outputIndexes": [ 1260 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1259, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1859", "outputIndexes": [ 1261 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1261 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1860", "outputIndexes": [ 1262 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1257, 1260, 1262, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1863", "outputIndexes": [ 1263 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1263 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1864", "outputIndexes": [ 1264 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1264 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1865", "outputIndexes": [ 1265 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1265, 1264 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1866", "outputIndexes": [ 1266 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1256, 1266, 1259 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.13/self_attn/Gather_3_output_0", "outputIndexes": [ 1267 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1267, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Div_1_output_0", "outputIndexes": [ 1268 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1268, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1269 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1254, 1269, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_3_output_0", "outputIndexes": [ 1270 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1270 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.13/self_attn/Neg_1_output_0", "outputIndexes": [ 1271 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1268, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1272 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1254, 20, 1272, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.13/self_attn/Slice_2_output_0", "outputIndexes": [ 1273 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1271, 1273 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.13/self_attn/Concat_4_output_0", "outputIndexes": [ 1274 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1274, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Mul_3_output_0", "outputIndexes": [ 1275 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1255, 1275 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/self_attn/Add_1_output_0", "outputIndexes": [ 1276 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3262 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1607567358, 2097174, 262144, 0, 0 ] } , "name": "/layers.13/self_attn/v_proj/Linear", "outputIndexes": [ 3271 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3271 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3272 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3272 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1277 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1278 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.13/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1279 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1278, 1279, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.13/self_attn/Concat_2_output_0", "outputIndexes": [ 1280 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1277, 1280 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.13/self_attn/Reshape_2_output_0", "outputIndexes": [ 1281 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1249, 1276, 1281, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.13/self_attn/FusedAttention", "outputIndexes": [ 1282 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1282 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3273 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3273 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3274 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3274 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1609926676, 8388630, 1048576, 0, 0 ] } , "name": "/layers.13/self_attn/o_proj/Linear", "outputIndexes": [ 3275 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3275 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3276 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3276 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1283 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1203, 1283 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/Add_output_0", "outputIndexes": [ 1284 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1284 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1619363882, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.13/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1285 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1285 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3277 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3277 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3278 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3278 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1619396650, 29360150, 3670016, 0, 0 ] } , "name": "/layers.13/mlp/gate_proj/Linear", "outputIndexes": [ 3279 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3279 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3280 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3280 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1286 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1286 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.13/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1287 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3278 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1652426816, 29360150, 3670016, 0, 0 ] } , "name": "/layers.13/mlp/up_proj/Linear", "outputIndexes": [ 3283 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3283 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3284 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3284 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1288 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1287, 1288 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/mlp/Mul_output_0", "outputIndexes": [ 1289 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1289 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3285 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3285 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3286 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3286 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1685456982, 29360150, 3670016, 0, 0 ] } , "name": "/layers.13/mlp/down_proj/Linear", "outputIndexes": [ 3287 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3287 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3288 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3288 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1290 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1284, 1290 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.13/Add_1_output_0", "outputIndexes": [ 1291 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1291, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/Reshape_output_0", "outputIndexes": [ 1292 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1292 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1718487148, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.14/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1293 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1293 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3289 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3289 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3290 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3290 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1718519916, 8388630, 1048576, 0, 0 ] } , "name": "/layers.14/self_attn/q_proj/Linear", "outputIndexes": [ 3291 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3291 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3292 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3292 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1294 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1293 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_output_0", "outputIndexes": [ 1295 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1295 ] , "main_type": "NONE", "name": "Shape1912", "outputIndexes": [ 1296 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1295 ] , "main_type": "NONE", "name": "Rank1914", "outputIndexes": [ 1297 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1297, 1297 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1916", "outputIndexes": [ 1298 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1298 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1917", "outputIndexes": [ 1299 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1298, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1919", "outputIndexes": [ 1300 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1300 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1920", "outputIndexes": [ 1301 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1296, 1299, 1301, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1923", "outputIndexes": [ 1302 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1302 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1924", "outputIndexes": [ 1303 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1303, 1303 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1926", "outputIndexes": [ 1304 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1295, 1304, 1298 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_output_0", "outputIndexes": [ 1305 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1305, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1306 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1298 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1934", "outputIndexes": [ 1307 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1300 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1937", "outputIndexes": [ 1308 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1296, 1307, 1308, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1940", "outputIndexes": [ 1309 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1309 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1941", "outputIndexes": [ 1310 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1310 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1942", "outputIndexes": [ 1311 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1311, 1310 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1943", "outputIndexes": [ 1312 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1295, 1312, 1298 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_1_output_0", "outputIndexes": [ 1313 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1314 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1306, 1314, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_output_0", "outputIndexes": [ 1315 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1294, 1315 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_output_0", "outputIndexes": [ 1316 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1316, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_output_0", "outputIndexes": [ 1317 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1316 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_2_output_0", "outputIndexes": [ 1318 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1318 ] , "main_type": "NONE", "name": "Shape1950", "outputIndexes": [ 1319 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1318 ] , "main_type": "NONE", "name": "Rank1952", "outputIndexes": [ 1320 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1320, 1320 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1954", "outputIndexes": [ 1321 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1321 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1955", "outputIndexes": [ 1322 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1321, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1957", "outputIndexes": [ 1323 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1323 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1958", "outputIndexes": [ 1324 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1319, 1322, 1324, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1961", "outputIndexes": [ 1325 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1325 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1962", "outputIndexes": [ 1326 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1326 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1963", "outputIndexes": [ 1327 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1327, 1326 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1964", "outputIndexes": [ 1328 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1318, 1328, 1321 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_2_output_0", "outputIndexes": [ 1329 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1329, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Div_output_0", "outputIndexes": [ 1330 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1330, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1331 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1316, 1331, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_1_output_0", "outputIndexes": [ 1332 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1332 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.14/self_attn/Neg_output_0", "outputIndexes": [ 1333 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1330, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1334 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1316, 20, 1334, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_output_0", "outputIndexes": [ 1335 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1333, 1335 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.14/self_attn/Concat_3_output_0", "outputIndexes": [ 1336 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1336, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_1_output_0", "outputIndexes": [ 1337 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1317, 1337 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Add_output_0", "outputIndexes": [ 1338 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3290 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1727957122, 2097174, 262144, 0, 0 ] } , "name": "/layers.14/self_attn/k_proj/Linear", "outputIndexes": [ 3295 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3295 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3296 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3296 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1339 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1305, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1340 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1341 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1340, 1341, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_1_output_0", "outputIndexes": [ 1342 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1339, 1342 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_1_output_0", "outputIndexes": [ 1343 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_2_output_0", "outputIndexes": [ 1344 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343 ] , "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_3_output_0", "outputIndexes": [ 1345 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1345 ] , "main_type": "NONE", "name": "Shape1983", "outputIndexes": [ 1346 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1345 ] , "main_type": "NONE", "name": "Rank1985", "outputIndexes": [ 1347 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1347, 1347 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1987", "outputIndexes": [ 1348 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1348 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1988", "outputIndexes": [ 1349 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1348, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1990", "outputIndexes": [ 1350 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1350 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1991", "outputIndexes": [ 1351 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1346, 1349, 1351, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1994", "outputIndexes": [ 1352 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1352 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1995", "outputIndexes": [ 1353 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1353 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1996", "outputIndexes": [ 1354 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1354, 1353 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1997", "outputIndexes": [ 1355 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1345, 1355, 1348 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.14/self_attn/Gather_3_output_0", "outputIndexes": [ 1356 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1356, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Div_1_output_0", "outputIndexes": [ 1357 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1357, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1358 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343, 1358, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_3_output_0", "outputIndexes": [ 1359 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1359 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.14/self_attn/Neg_1_output_0", "outputIndexes": [ 1360 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1357, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1361 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343, 20, 1361, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.14/self_attn/Slice_2_output_0", "outputIndexes": [ 1362 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1360, 1362 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.14/self_attn/Concat_4_output_0", "outputIndexes": [ 1363 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1363, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Mul_3_output_0", "outputIndexes": [ 1364 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1344, 1364 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/self_attn/Add_1_output_0", "outputIndexes": [ 1365 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3290 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1730316440, 2097174, 262144, 0, 0 ] } , "name": "/layers.14/self_attn/v_proj/Linear", "outputIndexes": [ 3299 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3299 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3300 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3300 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1366 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1305, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1367 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.14/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1368 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1367, 1368, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.14/self_attn/Concat_2_output_0", "outputIndexes": [ 1369 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1366, 1369 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.14/self_attn/Reshape_2_output_0", "outputIndexes": [ 1370 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1338, 1365, 1370, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.14/self_attn/FusedAttention", "outputIndexes": [ 1371 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1371 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3301 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3301 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3302 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3302 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1732675758, 8388630, 1048576, 0, 0 ] } , "name": "/layers.14/self_attn/o_proj/Linear", "outputIndexes": [ 3303 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3303 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3304 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3304 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1372 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1292, 1372 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/Add_output_0", "outputIndexes": [ 1373 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1373 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1742112964, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.14/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1374 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1374 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3305 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3305 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3306 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3306 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1742145732, 29360150, 3670016, 0, 0 ] } , "name": "/layers.14/mlp/gate_proj/Linear", "outputIndexes": [ 3307 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3307 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3308 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3308 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1375 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1375 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.14/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1376 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3306 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1775175898, 29360150, 3670016, 0, 0 ] } , "name": "/layers.14/mlp/up_proj/Linear", "outputIndexes": [ 3311 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3311 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3312 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3312 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1377 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1376, 1377 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/mlp/Mul_output_0", "outputIndexes": [ 1378 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1378 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3313 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3313 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3314 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3314 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1808206064, 29360150, 3670016, 0, 0 ] } , "name": "/layers.14/mlp/down_proj/Linear", "outputIndexes": [ 3315 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3315 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3316 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3316 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1379 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1373, 1379 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.14/Add_1_output_0", "outputIndexes": [ 1380 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1380, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/Reshape_output_0", "outputIndexes": [ 1381 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1381 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1841236230, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.15/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1382 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1382 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3317 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3317 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3318 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3318 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1841268998, 8388630, 1048576, 0, 0 ] } , "name": "/layers.15/self_attn/q_proj/Linear", "outputIndexes": [ 3319 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3319 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3320 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3320 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1383 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1382 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_output_0", "outputIndexes": [ 1384 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1384 ] , "main_type": "NONE", "name": "Shape2043", "outputIndexes": [ 1385 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1384 ] , "main_type": "NONE", "name": "Rank2045", "outputIndexes": [ 1386 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1386, 1386 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2047", "outputIndexes": [ 1387 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1387 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2048", "outputIndexes": [ 1388 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1387, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2050", "outputIndexes": [ 1389 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1389 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2051", "outputIndexes": [ 1390 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1385, 1388, 1390, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2054", "outputIndexes": [ 1391 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1391 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2055", "outputIndexes": [ 1392 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1392, 1392 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2057", "outputIndexes": [ 1393 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1384, 1393, 1387 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_output_0", "outputIndexes": [ 1394 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1394, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1395 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1387 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2065", "outputIndexes": [ 1396 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1389 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2068", "outputIndexes": [ 1397 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1385, 1396, 1397, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2071", "outputIndexes": [ 1398 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1398 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2072", "outputIndexes": [ 1399 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1399 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2073", "outputIndexes": [ 1400 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1400, 1399 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2074", "outputIndexes": [ 1401 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1384, 1401, 1387 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_1_output_0", "outputIndexes": [ 1402 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1402, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1403 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1395, 1403, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_output_0", "outputIndexes": [ 1404 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1383, 1404 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_output_0", "outputIndexes": [ 1405 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1405, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_output_0", "outputIndexes": [ 1406 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1405 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_2_output_0", "outputIndexes": [ 1407 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1407 ] , "main_type": "NONE", "name": "Shape2081", "outputIndexes": [ 1408 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1407 ] , "main_type": "NONE", "name": "Rank2083", "outputIndexes": [ 1409 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1409, 1409 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2085", "outputIndexes": [ 1410 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1410 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2086", "outputIndexes": [ 1411 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1410, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2088", "outputIndexes": [ 1412 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1412 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2089", "outputIndexes": [ 1413 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1408, 1411, 1413, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2092", "outputIndexes": [ 1414 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1414 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2093", "outputIndexes": [ 1415 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1415 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2094", "outputIndexes": [ 1416 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1416, 1415 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2095", "outputIndexes": [ 1417 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407, 1417, 1410 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_2_output_0", "outputIndexes": [ 1418 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1418, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Div_output_0", "outputIndexes": [ 1419 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1419, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1420 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1405, 1420, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_1_output_0", "outputIndexes": [ 1421 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1421 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.15/self_attn/Neg_output_0", "outputIndexes": [ 1422 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1419, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1423 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1405, 20, 1423, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_output_0", "outputIndexes": [ 1424 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1422, 1424 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.15/self_attn/Concat_3_output_0", "outputIndexes": [ 1425 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1425, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_1_output_0", "outputIndexes": [ 1426 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1406, 1426 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Add_output_0", "outputIndexes": [ 1427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3318 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1850706204, 2097174, 262144, 0, 0 ] } , "name": "/layers.15/self_attn/k_proj/Linear", "outputIndexes": [ 3323 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3323 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3324 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3324 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1428 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1394, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1429 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1402, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1430 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1429, 1430, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_1_output_0", "outputIndexes": [ 1431 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1428, 1431 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_1_output_0", "outputIndexes": [ 1432 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1432, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_2_output_0", "outputIndexes": [ 1433 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1432 ] , "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_3_output_0", "outputIndexes": [ 1434 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1434 ] , "main_type": "NONE", "name": "Shape2114", "outputIndexes": [ 1435 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1434 ] , "main_type": "NONE", "name": "Rank2116", "outputIndexes": [ 1436 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1436, 1436 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2118", "outputIndexes": [ 1437 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1437 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2119", "outputIndexes": [ 1438 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1437, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2121", "outputIndexes": [ 1439 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1439 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2122", "outputIndexes": [ 1440 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1435, 1438, 1440, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2125", "outputIndexes": [ 1441 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1441 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2126", "outputIndexes": [ 1442 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1442 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2127", "outputIndexes": [ 1443 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1443, 1442 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2128", "outputIndexes": [ 1444 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1434, 1444, 1437 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.15/self_attn/Gather_3_output_0", "outputIndexes": [ 1445 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1445, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Div_1_output_0", "outputIndexes": [ 1446 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1446, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1447 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1432, 1447, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_3_output_0", "outputIndexes": [ 1448 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1448 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.15/self_attn/Neg_1_output_0", "outputIndexes": [ 1449 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1446, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1450 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1432, 20, 1450, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.15/self_attn/Slice_2_output_0", "outputIndexes": [ 1451 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1449, 1451 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.15/self_attn/Concat_4_output_0", "outputIndexes": [ 1452 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1452, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Mul_3_output_0", "outputIndexes": [ 1453 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1433, 1453 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/self_attn/Add_1_output_0", "outputIndexes": [ 1454 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3318 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1853065522, 2097174, 262144, 0, 0 ] } , "name": "/layers.15/self_attn/v_proj/Linear", "outputIndexes": [ 3327 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3327 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3328 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3328 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1455 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1394, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1456 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1402, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.15/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1457 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1456, 1457, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.15/self_attn/Concat_2_output_0", "outputIndexes": [ 1458 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1455, 1458 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.15/self_attn/Reshape_2_output_0", "outputIndexes": [ 1459 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1427, 1454, 1459, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.15/self_attn/FusedAttention", "outputIndexes": [ 1460 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1460 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3329 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3329 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3330 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3330 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1855424840, 8388630, 1048576, 0, 0 ] } , "name": "/layers.15/self_attn/o_proj/Linear", "outputIndexes": [ 3331 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3331 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3332 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3332 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1461 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1381, 1461 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/Add_output_0", "outputIndexes": [ 1462 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1864862046, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.15/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1463 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1463 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3333 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3333 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3334 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3334 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1864894814, 29360150, 3670016, 0, 0 ] } , "name": "/layers.15/mlp/gate_proj/Linear", "outputIndexes": [ 3335 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3335 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3336 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3336 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1464 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1464 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.15/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1465 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3334 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1897924980, 29360150, 3670016, 0, 0 ] } , "name": "/layers.15/mlp/up_proj/Linear", "outputIndexes": [ 3339 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3339 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3340 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3340 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1466 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1465, 1466 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/mlp/Mul_output_0", "outputIndexes": [ 1467 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1467 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3341 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3341 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3342 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3342 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1930955146, 29360150, 3670016, 0, 0 ] } , "name": "/layers.15/mlp/down_proj/Linear", "outputIndexes": [ 3343 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3343 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3344 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3344 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1468 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462, 1468 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.15/Add_1_output_0", "outputIndexes": [ 1469 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1469, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/Reshape_output_0", "outputIndexes": [ 1470 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1470 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1963985312, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.16/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1471 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1471 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3345 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3345 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3346 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3346 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1964018080, 8388630, 1048576, 0, 0 ] } , "name": "/layers.16/self_attn/q_proj/Linear", "outputIndexes": [ 3347 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3347 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3348 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3348 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1472 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1471 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_output_0", "outputIndexes": [ 1473 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1473 ] , "main_type": "NONE", "name": "Shape2174", "outputIndexes": [ 1474 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1473 ] , "main_type": "NONE", "name": "Rank2176", "outputIndexes": [ 1475 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1475, 1475 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2178", "outputIndexes": [ 1476 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2179", "outputIndexes": [ 1477 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2181", "outputIndexes": [ 1478 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1478 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2182", "outputIndexes": [ 1479 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1474, 1477, 1479, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2185", "outputIndexes": [ 1480 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1480 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2186", "outputIndexes": [ 1481 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1481, 1481 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2188", "outputIndexes": [ 1482 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1473, 1482, 1476 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_output_0", "outputIndexes": [ 1483 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1484 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2196", "outputIndexes": [ 1485 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1478 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2199", "outputIndexes": [ 1486 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1474, 1485, 1486, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2202", "outputIndexes": [ 1487 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1487 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2203", "outputIndexes": [ 1488 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1488 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2204", "outputIndexes": [ 1489 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1489, 1488 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2205", "outputIndexes": [ 1490 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1473, 1490, 1476 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_1_output_0", "outputIndexes": [ 1491 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1491, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1492 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1484, 1492, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_output_0", "outputIndexes": [ 1493 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1472, 1493 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_output_0", "outputIndexes": [ 1494 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_output_0", "outputIndexes": [ 1495 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_2_output_0", "outputIndexes": [ 1496 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1496 ] , "main_type": "NONE", "name": "Shape2212", "outputIndexes": [ 1497 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1496 ] , "main_type": "NONE", "name": "Rank2214", "outputIndexes": [ 1498 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1498, 1498 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2216", "outputIndexes": [ 1499 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1499 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2217", "outputIndexes": [ 1500 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1499, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2219", "outputIndexes": [ 1501 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1501 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2220", "outputIndexes": [ 1502 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1497, 1500, 1502, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2223", "outputIndexes": [ 1503 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1503 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2224", "outputIndexes": [ 1504 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1504 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2225", "outputIndexes": [ 1505 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1505, 1504 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2226", "outputIndexes": [ 1506 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496, 1506, 1499 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_2_output_0", "outputIndexes": [ 1507 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1507, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Div_output_0", "outputIndexes": [ 1508 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1508, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1509 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494, 1509, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_1_output_0", "outputIndexes": [ 1510 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1510 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.16/self_attn/Neg_output_0", "outputIndexes": [ 1511 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1508, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1512 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494, 20, 1512, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_output_0", "outputIndexes": [ 1513 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1511, 1513 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.16/self_attn/Concat_3_output_0", "outputIndexes": [ 1514 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1514, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_1_output_0", "outputIndexes": [ 1515 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1495, 1515 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Add_output_0", "outputIndexes": [ 1516 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3346 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1973455286, 2097174, 262144, 0, 0 ] } , "name": "/layers.16/self_attn/k_proj/Linear", "outputIndexes": [ 3351 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3351 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3352 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3352 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1517 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1518 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1491, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1519 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1518, 1519, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_1_output_0", "outputIndexes": [ 1520 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1517, 1520 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_1_output_0", "outputIndexes": [ 1521 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_2_output_0", "outputIndexes": [ 1522 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521 ] , "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_3_output_0", "outputIndexes": [ 1523 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1523 ] , "main_type": "NONE", "name": "Shape2245", "outputIndexes": [ 1524 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1523 ] , "main_type": "NONE", "name": "Rank2247", "outputIndexes": [ 1525 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1525, 1525 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2249", "outputIndexes": [ 1526 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2250", "outputIndexes": [ 1527 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2252", "outputIndexes": [ 1528 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1528 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2253", "outputIndexes": [ 1529 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1524, 1527, 1529, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2256", "outputIndexes": [ 1530 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1530 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2257", "outputIndexes": [ 1531 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1531 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2258", "outputIndexes": [ 1532 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1532, 1531 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2259", "outputIndexes": [ 1533 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1523, 1533, 1526 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.16/self_attn/Gather_3_output_0", "outputIndexes": [ 1534 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1534, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Div_1_output_0", "outputIndexes": [ 1535 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1535, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1536 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521, 1536, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_3_output_0", "outputIndexes": [ 1537 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1537 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.16/self_attn/Neg_1_output_0", "outputIndexes": [ 1538 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1535, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1539 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521, 20, 1539, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.16/self_attn/Slice_2_output_0", "outputIndexes": [ 1540 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1538, 1540 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.16/self_attn/Concat_4_output_0", "outputIndexes": [ 1541 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1541, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Mul_3_output_0", "outputIndexes": [ 1542 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1522, 1542 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/self_attn/Add_1_output_0", "outputIndexes": [ 1543 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3346 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1975814604, 2097174, 262144, 0, 0 ] } , "name": "/layers.16/self_attn/v_proj/Linear", "outputIndexes": [ 3355 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3355 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3356 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3356 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1544 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1545 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1491, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.16/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1546 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1545, 1546, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.16/self_attn/Concat_2_output_0", "outputIndexes": [ 1547 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1544, 1547 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.16/self_attn/Reshape_2_output_0", "outputIndexes": [ 1548 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1516, 1543, 1548, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.16/self_attn/FusedAttention", "outputIndexes": [ 1549 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1549 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3357 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3357 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3358 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3358 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1978173922, 8388630, 1048576, 0, 0 ] } , "name": "/layers.16/self_attn/o_proj/Linear", "outputIndexes": [ 3359 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3359 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3360 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3360 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1550 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1470, 1550 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/Add_output_0", "outputIndexes": [ 1551 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1551 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1987611128, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.16/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1552 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1552 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3361 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3361 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3362 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3362 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1987643896, 29360150, 3670016, 0, 0 ] } , "name": "/layers.16/mlp/gate_proj/Linear", "outputIndexes": [ 3363 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3363 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3364 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3364 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1553 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1553 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.16/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1554 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3362 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2020674062, 29360150, 3670016, 0, 0 ] } , "name": "/layers.16/mlp/up_proj/Linear", "outputIndexes": [ 3367 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3367 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3368 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3368 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1555 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1554, 1555 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/mlp/Mul_output_0", "outputIndexes": [ 1556 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1556 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3369 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3369 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3370 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3370 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2053704228, 29360150, 3670016, 0, 0 ] } , "name": "/layers.16/mlp/down_proj/Linear", "outputIndexes": [ 3371 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3371 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3372 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3372 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1557 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1551, 1557 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.16/Add_1_output_0", "outputIndexes": [ 1558 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1558, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/Reshape_output_0", "outputIndexes": [ 1559 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1559 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2086734394, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.17/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1560 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3373 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3373 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3374 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3374 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2086767162, 8388630, 1048576, 0, 0 ] } , "name": "/layers.17/self_attn/q_proj/Linear", "outputIndexes": [ 3375 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3375 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3376 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3376 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1561 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_output_0", "outputIndexes": [ 1562 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1562 ] , "main_type": "NONE", "name": "Shape2305", "outputIndexes": [ 1563 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1562 ] , "main_type": "NONE", "name": "Rank2307", "outputIndexes": [ 1564 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1564, 1564 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2309", "outputIndexes": [ 1565 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1565 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2310", "outputIndexes": [ 1566 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1565, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2312", "outputIndexes": [ 1567 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1567 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2313", "outputIndexes": [ 1568 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1563, 1566, 1568, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2316", "outputIndexes": [ 1569 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1569 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2317", "outputIndexes": [ 1570 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1570, 1570 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2319", "outputIndexes": [ 1571 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1562, 1571, 1565 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_output_0", "outputIndexes": [ 1572 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1572, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1573 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1565 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2327", "outputIndexes": [ 1574 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1567 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2330", "outputIndexes": [ 1575 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1563, 1574, 1575, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2333", "outputIndexes": [ 1576 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1576 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2334", "outputIndexes": [ 1577 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1577 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2335", "outputIndexes": [ 1578 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1578, 1577 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2336", "outputIndexes": [ 1579 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1562, 1579, 1565 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_1_output_0", "outputIndexes": [ 1580 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1580, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1581 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1573, 1581, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_output_0", "outputIndexes": [ 1582 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1561, 1582 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_output_0", "outputIndexes": [ 1583 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_output_0", "outputIndexes": [ 1584 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_2_output_0", "outputIndexes": [ 1585 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1585 ] , "main_type": "NONE", "name": "Shape2343", "outputIndexes": [ 1586 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1585 ] , "main_type": "NONE", "name": "Rank2345", "outputIndexes": [ 1587 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1587, 1587 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2347", "outputIndexes": [ 1588 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1588 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2348", "outputIndexes": [ 1589 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1588, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2350", "outputIndexes": [ 1590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1590 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2351", "outputIndexes": [ 1591 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1586, 1589, 1591, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2354", "outputIndexes": [ 1592 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1592 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2355", "outputIndexes": [ 1593 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1593 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2356", "outputIndexes": [ 1594 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1594, 1593 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2357", "outputIndexes": [ 1595 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1585, 1595, 1588 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_2_output_0", "outputIndexes": [ 1596 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1596, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Div_output_0", "outputIndexes": [ 1597 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1597, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1598 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583, 1598, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_1_output_0", "outputIndexes": [ 1599 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1599 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.17/self_attn/Neg_output_0", "outputIndexes": [ 1600 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1597, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1601 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583, 20, 1601, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_output_0", "outputIndexes": [ 1602 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1600, 1602 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.17/self_attn/Concat_3_output_0", "outputIndexes": [ 1603 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1603, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_1_output_0", "outputIndexes": [ 1604 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1584, 1604 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Add_output_0", "outputIndexes": [ 1605 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3374 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2096204368, 2097174, 262144, 0, 0 ] } , "name": "/layers.17/self_attn/k_proj/Linear", "outputIndexes": [ 3379 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3379 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3380 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3380 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1606 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1572, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1607 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1580, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1608 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1607, 1608, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_1_output_0", "outputIndexes": [ 1609 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1606, 1609 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_1_output_0", "outputIndexes": [ 1610 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1610, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_2_output_0", "outputIndexes": [ 1611 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1610 ] , "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_3_output_0", "outputIndexes": [ 1612 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1612 ] , "main_type": "NONE", "name": "Shape2376", "outputIndexes": [ 1613 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1612 ] , "main_type": "NONE", "name": "Rank2378", "outputIndexes": [ 1614 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1614, 1614 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2380", "outputIndexes": [ 1615 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1615 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2381", "outputIndexes": [ 1616 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1615, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2383", "outputIndexes": [ 1617 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1617 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2384", "outputIndexes": [ 1618 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1613, 1616, 1618, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2387", "outputIndexes": [ 1619 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2388", "outputIndexes": [ 1620 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1620 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2389", "outputIndexes": [ 1621 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1621, 1620 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2390", "outputIndexes": [ 1622 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1612, 1622, 1615 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.17/self_attn/Gather_3_output_0", "outputIndexes": [ 1623 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1623, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Div_1_output_0", "outputIndexes": [ 1624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1624, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1625 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1610, 1625, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_3_output_0", "outputIndexes": [ 1626 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1626 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.17/self_attn/Neg_1_output_0", "outputIndexes": [ 1627 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1624, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1628 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1610, 20, 1628, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.17/self_attn/Slice_2_output_0", "outputIndexes": [ 1629 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1627, 1629 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.17/self_attn/Concat_4_output_0", "outputIndexes": [ 1630 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1630, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Mul_3_output_0", "outputIndexes": [ 1631 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1611, 1631 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/self_attn/Add_1_output_0", "outputIndexes": [ 1632 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3374 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2098563686, 2097174, 262144, 0, 0 ] } , "name": "/layers.17/self_attn/v_proj/Linear", "outputIndexes": [ 3383 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3383 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3384 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3384 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1633 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1572, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1634 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1580, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.17/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1635 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1634, 1635, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.17/self_attn/Concat_2_output_0", "outputIndexes": [ 1636 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1633, 1636 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.17/self_attn/Reshape_2_output_0", "outputIndexes": [ 1637 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1605, 1632, 1637, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.17/self_attn/FusedAttention", "outputIndexes": [ 1638 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1638 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3385 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3385 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3386 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3386 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2100923004, 8388630, 1048576, 0, 0 ] } , "name": "/layers.17/self_attn/o_proj/Linear", "outputIndexes": [ 3387 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3387 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3388 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3388 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1639 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1559, 1639 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/Add_output_0", "outputIndexes": [ 1640 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2110360210, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.17/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1641 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1641 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3389 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3389 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3390 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3390 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2110392978, 29360150, 3670016, 0, 0 ] } , "name": "/layers.17/mlp/gate_proj/Linear", "outputIndexes": [ 3391 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3391 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3392 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3392 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1642 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1642 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.17/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1643 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3390 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2143423144, 29360150, 3670016, 0, 0 ] } , "name": "/layers.17/mlp/up_proj/Linear", "outputIndexes": [ 3395 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3395 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3396 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3396 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1644 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1643, 1644 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/mlp/Mul_output_0", "outputIndexes": [ 1645 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1645 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3397 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3397 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3398 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3398 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2176453310, 29360150, 3670016, 0, 0 ] } , "name": "/layers.17/mlp/down_proj/Linear", "outputIndexes": [ 3399 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3399 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3400 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3400 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1646 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640, 1646 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.17/Add_1_output_0", "outputIndexes": [ 1647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1647, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/Reshape_output_0", "outputIndexes": [ 1648 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2209483476, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.18/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1649 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1649 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3401 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3401 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3402 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3402 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2209516244, 8388630, 1048576, 0, 0 ] } , "name": "/layers.18/self_attn/q_proj/Linear", "outputIndexes": [ 3403 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3403 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3404 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3404 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1650 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1649 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_output_0", "outputIndexes": [ 1651 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1651 ] , "main_type": "NONE", "name": "Shape2436", "outputIndexes": [ 1652 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1651 ] , "main_type": "NONE", "name": "Rank2438", "outputIndexes": [ 1653 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 1653 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2440", "outputIndexes": [ 1654 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1654 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2441", "outputIndexes": [ 1655 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1654, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2443", "outputIndexes": [ 1656 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1656 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2444", "outputIndexes": [ 1657 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1652, 1655, 1657, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2447", "outputIndexes": [ 1658 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1658 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2448", "outputIndexes": [ 1659 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1659, 1659 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2450", "outputIndexes": [ 1660 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1651, 1660, 1654 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_output_0", "outputIndexes": [ 1661 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1661, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1662 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1654 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2458", "outputIndexes": [ 1663 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1656 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2461", "outputIndexes": [ 1664 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1652, 1663, 1664, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2464", "outputIndexes": [ 1665 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1665 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2465", "outputIndexes": [ 1666 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1666 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2466", "outputIndexes": [ 1667 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1667, 1666 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2467", "outputIndexes": [ 1668 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1651, 1668, 1654 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_1_output_0", "outputIndexes": [ 1669 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1669, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1670 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1662, 1670, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_output_0", "outputIndexes": [ 1671 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1650, 1671 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_output_0", "outputIndexes": [ 1672 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1672, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_output_0", "outputIndexes": [ 1673 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1672 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_2_output_0", "outputIndexes": [ 1674 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1674 ] , "main_type": "NONE", "name": "Shape2474", "outputIndexes": [ 1675 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1674 ] , "main_type": "NONE", "name": "Rank2476", "outputIndexes": [ 1676 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1676, 1676 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2478", "outputIndexes": [ 1677 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1677 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2479", "outputIndexes": [ 1678 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1677, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2481", "outputIndexes": [ 1679 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1679 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2482", "outputIndexes": [ 1680 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1675, 1678, 1680, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2485", "outputIndexes": [ 1681 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1681 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2486", "outputIndexes": [ 1682 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1682 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2487", "outputIndexes": [ 1683 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1683, 1682 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2488", "outputIndexes": [ 1684 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1674, 1684, 1677 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_2_output_0", "outputIndexes": [ 1685 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1685, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Div_output_0", "outputIndexes": [ 1686 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1686, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1687 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1672, 1687, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_1_output_0", "outputIndexes": [ 1688 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1688 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.18/self_attn/Neg_output_0", "outputIndexes": [ 1689 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1686, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1690 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1672, 20, 1690, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_output_0", "outputIndexes": [ 1691 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1689, 1691 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.18/self_attn/Concat_3_output_0", "outputIndexes": [ 1692 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1692, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_1_output_0", "outputIndexes": [ 1693 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1673, 1693 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Add_output_0", "outputIndexes": [ 1694 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3402 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2218953450, 2097174, 262144, 0, 0 ] } , "name": "/layers.18/self_attn/k_proj/Linear", "outputIndexes": [ 3407 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3407 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3408 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3408 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1695 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1661, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1696 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1669, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1697 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1696, 1697, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_1_output_0", "outputIndexes": [ 1698 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1695, 1698 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_1_output_0", "outputIndexes": [ 1699 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_2_output_0", "outputIndexes": [ 1700 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699 ] , "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_3_output_0", "outputIndexes": [ 1701 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1701 ] , "main_type": "NONE", "name": "Shape2507", "outputIndexes": [ 1702 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1701 ] , "main_type": "NONE", "name": "Rank2509", "outputIndexes": [ 1703 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1703, 1703 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2511", "outputIndexes": [ 1704 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1704 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2512", "outputIndexes": [ 1705 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1704, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2514", "outputIndexes": [ 1706 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1706 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2515", "outputIndexes": [ 1707 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1702, 1705, 1707, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2518", "outputIndexes": [ 1708 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1708 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2519", "outputIndexes": [ 1709 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1709 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2520", "outputIndexes": [ 1710 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1710, 1709 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2521", "outputIndexes": [ 1711 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1701, 1711, 1704 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.18/self_attn/Gather_3_output_0", "outputIndexes": [ 1712 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1712, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Div_1_output_0", "outputIndexes": [ 1713 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1713, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1714 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 1714, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_3_output_0", "outputIndexes": [ 1715 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1715 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.18/self_attn/Neg_1_output_0", "outputIndexes": [ 1716 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1713, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1717 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 20, 1717, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.18/self_attn/Slice_2_output_0", "outputIndexes": [ 1718 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1716, 1718 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.18/self_attn/Concat_4_output_0", "outputIndexes": [ 1719 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1719, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Mul_3_output_0", "outputIndexes": [ 1720 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1700, 1720 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/self_attn/Add_1_output_0", "outputIndexes": [ 1721 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3402 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2221312768, 2097174, 262144, 0, 0 ] } , "name": "/layers.18/self_attn/v_proj/Linear", "outputIndexes": [ 3411 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3411 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3412 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3412 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1722 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1661, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1723 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1669, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.18/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1724 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1723, 1724, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.18/self_attn/Concat_2_output_0", "outputIndexes": [ 1725 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1722, 1725 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.18/self_attn/Reshape_2_output_0", "outputIndexes": [ 1726 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1694, 1721, 1726, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.18/self_attn/FusedAttention", "outputIndexes": [ 1727 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1727 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3413 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3413 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3414 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3414 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2223672086, 8388630, 1048576, 0, 0 ] } , "name": "/layers.18/self_attn/o_proj/Linear", "outputIndexes": [ 3415 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3415 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3416 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3416 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1728 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 1728 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/Add_output_0", "outputIndexes": [ 1729 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1729 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2233109292, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.18/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1730 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1730 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3417 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3417 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3418 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3418 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2233142060, 29360150, 3670016, 0, 0 ] } , "name": "/layers.18/mlp/gate_proj/Linear", "outputIndexes": [ 3419 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3419 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3420 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3420 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1731 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1731 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.18/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1732 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3418 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2266172226, 29360150, 3670016, 0, 0 ] } , "name": "/layers.18/mlp/up_proj/Linear", "outputIndexes": [ 3423 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3423 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3424 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3424 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1733 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1732, 1733 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/mlp/Mul_output_0", "outputIndexes": [ 1734 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1734 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3425 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3425 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3426 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3426 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2299202392, 29360150, 3670016, 0, 0 ] } , "name": "/layers.18/mlp/down_proj/Linear", "outputIndexes": [ 3427 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3427 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3428 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3428 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1735 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1729, 1735 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.18/Add_1_output_0", "outputIndexes": [ 1736 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1736, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/Reshape_output_0", "outputIndexes": [ 1737 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1737 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2332232558, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.19/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1738 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1738 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3429 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3429 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3430 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3430 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2332265326, 8388630, 1048576, 0, 0 ] } , "name": "/layers.19/self_attn/q_proj/Linear", "outputIndexes": [ 3431 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3431 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3432 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3432 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1739 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1738 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_output_0", "outputIndexes": [ 1740 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1740 ] , "main_type": "NONE", "name": "Shape2567", "outputIndexes": [ 1741 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1740 ] , "main_type": "NONE", "name": "Rank2569", "outputIndexes": [ 1742 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1742, 1742 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2571", "outputIndexes": [ 1743 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1743 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2572", "outputIndexes": [ 1744 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1743, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2574", "outputIndexes": [ 1745 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1745 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2575", "outputIndexes": [ 1746 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 1744, 1746, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2578", "outputIndexes": [ 1747 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1747 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2579", "outputIndexes": [ 1748 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1748, 1748 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2581", "outputIndexes": [ 1749 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1740, 1749, 1743 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_output_0", "outputIndexes": [ 1750 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1750, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1751 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1743 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2589", "outputIndexes": [ 1752 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1745 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2592", "outputIndexes": [ 1753 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 1752, 1753, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2595", "outputIndexes": [ 1754 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1754 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2596", "outputIndexes": [ 1755 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1755 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2597", "outputIndexes": [ 1756 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1756, 1755 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2598", "outputIndexes": [ 1757 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1740, 1757, 1743 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_1_output_0", "outputIndexes": [ 1758 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1758, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1759 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1751, 1759, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_output_0", "outputIndexes": [ 1760 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1739, 1760 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_output_0", "outputIndexes": [ 1761 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1761, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_output_0", "outputIndexes": [ 1762 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1761 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_2_output_0", "outputIndexes": [ 1763 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1763 ] , "main_type": "NONE", "name": "Shape2605", "outputIndexes": [ 1764 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1763 ] , "main_type": "NONE", "name": "Rank2607", "outputIndexes": [ 1765 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1765, 1765 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2609", "outputIndexes": [ 1766 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1766 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2610", "outputIndexes": [ 1767 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1766, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2612", "outputIndexes": [ 1768 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1768 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2613", "outputIndexes": [ 1769 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1764, 1767, 1769, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2616", "outputIndexes": [ 1770 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1770 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2617", "outputIndexes": [ 1771 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1771 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2618", "outputIndexes": [ 1772 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1772, 1771 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2619", "outputIndexes": [ 1773 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1763, 1773, 1766 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_2_output_0", "outputIndexes": [ 1774 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1774, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Div_output_0", "outputIndexes": [ 1775 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1775, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1776 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1761, 1776, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_1_output_0", "outputIndexes": [ 1777 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1777 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.19/self_attn/Neg_output_0", "outputIndexes": [ 1778 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1775, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1779 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1761, 20, 1779, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_output_0", "outputIndexes": [ 1780 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1778, 1780 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.19/self_attn/Concat_3_output_0", "outputIndexes": [ 1781 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1781, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_1_output_0", "outputIndexes": [ 1782 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1762, 1782 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Add_output_0", "outputIndexes": [ 1783 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3430 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2341702532, 2097174, 262144, 0, 0 ] } , "name": "/layers.19/self_attn/k_proj/Linear", "outputIndexes": [ 3435 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3435 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3436 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3436 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1784 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1750, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1785 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1758, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1786 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1785, 1786, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_1_output_0", "outputIndexes": [ 1787 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1784, 1787 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_1_output_0", "outputIndexes": [ 1788 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1788, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_2_output_0", "outputIndexes": [ 1789 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1788 ] , "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_3_output_0", "outputIndexes": [ 1790 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1790 ] , "main_type": "NONE", "name": "Shape2638", "outputIndexes": [ 1791 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1790 ] , "main_type": "NONE", "name": "Rank2640", "outputIndexes": [ 1792 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1792, 1792 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2642", "outputIndexes": [ 1793 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1793 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2643", "outputIndexes": [ 1794 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1793, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2645", "outputIndexes": [ 1795 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1795 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2646", "outputIndexes": [ 1796 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1791, 1794, 1796, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2649", "outputIndexes": [ 1797 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1797 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2650", "outputIndexes": [ 1798 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1798 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2651", "outputIndexes": [ 1799 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1799, 1798 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2652", "outputIndexes": [ 1800 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1790, 1800, 1793 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.19/self_attn/Gather_3_output_0", "outputIndexes": [ 1801 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1801, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Div_1_output_0", "outputIndexes": [ 1802 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1802, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1803 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1788, 1803, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_3_output_0", "outputIndexes": [ 1804 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1804 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.19/self_attn/Neg_1_output_0", "outputIndexes": [ 1805 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1802, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1806 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1788, 20, 1806, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.19/self_attn/Slice_2_output_0", "outputIndexes": [ 1807 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1805, 1807 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.19/self_attn/Concat_4_output_0", "outputIndexes": [ 1808 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1808, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Mul_3_output_0", "outputIndexes": [ 1809 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1789, 1809 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/self_attn/Add_1_output_0", "outputIndexes": [ 1810 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3430 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2344061850, 2097174, 262144, 0, 0 ] } , "name": "/layers.19/self_attn/v_proj/Linear", "outputIndexes": [ 3439 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3439 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3440 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3440 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1811 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1750, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1812 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1758, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.19/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1813 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1812, 1813, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.19/self_attn/Concat_2_output_0", "outputIndexes": [ 1814 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1811, 1814 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.19/self_attn/Reshape_2_output_0", "outputIndexes": [ 1815 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1783, 1810, 1815, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.19/self_attn/FusedAttention", "outputIndexes": [ 1816 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1816 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3441 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3441 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3442 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3442 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2346421168, 8388630, 1048576, 0, 0 ] } , "name": "/layers.19/self_attn/o_proj/Linear", "outputIndexes": [ 3443 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3443 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3444 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3444 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1817 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1737, 1817 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/Add_output_0", "outputIndexes": [ 1818 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1818 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2355858374, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.19/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1819 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1819 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3445 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3445 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3446 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3446 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2355891142, 29360150, 3670016, 0, 0 ] } , "name": "/layers.19/mlp/gate_proj/Linear", "outputIndexes": [ 3447 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3447 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3448 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3448 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1820 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1820 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.19/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1821 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3446 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2388921308, 29360150, 3670016, 0, 0 ] } , "name": "/layers.19/mlp/up_proj/Linear", "outputIndexes": [ 3451 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3451 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3452 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3452 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1822 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1821, 1822 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/mlp/Mul_output_0", "outputIndexes": [ 1823 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1823 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3453 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3453 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3454 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3454 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2421951474, 29360150, 3670016, 0, 0 ] } , "name": "/layers.19/mlp/down_proj/Linear", "outputIndexes": [ 3455 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3455 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3456 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3456 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1824 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1818, 1824 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.19/Add_1_output_0", "outputIndexes": [ 1825 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1825, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/Reshape_output_0", "outputIndexes": [ 1826 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1826 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2454981640, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.20/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1827 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1827 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3457 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3457 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3458 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3458 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2455014408, 8388630, 1048576, 0, 0 ] } , "name": "/layers.20/self_attn/q_proj/Linear", "outputIndexes": [ 3459 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3459 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3460 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3460 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1828 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1827 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_output_0", "outputIndexes": [ 1829 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1829 ] , "main_type": "NONE", "name": "Shape2698", "outputIndexes": [ 1830 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1829 ] , "main_type": "NONE", "name": "Rank2700", "outputIndexes": [ 1831 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1831, 1831 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2702", "outputIndexes": [ 1832 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2703", "outputIndexes": [ 1833 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2705", "outputIndexes": [ 1834 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2706", "outputIndexes": [ 1835 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1830, 1833, 1835, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2709", "outputIndexes": [ 1836 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1836 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2710", "outputIndexes": [ 1837 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1837, 1837 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2712", "outputIndexes": [ 1838 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1829, 1838, 1832 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_output_0", "outputIndexes": [ 1839 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1840 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2720", "outputIndexes": [ 1841 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2723", "outputIndexes": [ 1842 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1830, 1841, 1842, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2726", "outputIndexes": [ 1843 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1843 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2727", "outputIndexes": [ 1844 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1844 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2728", "outputIndexes": [ 1845 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1845, 1844 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2729", "outputIndexes": [ 1846 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1829, 1846, 1832 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_1_output_0", "outputIndexes": [ 1847 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1847, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1848 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1840, 1848, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_output_0", "outputIndexes": [ 1849 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1828, 1849 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_output_0", "outputIndexes": [ 1850 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_output_0", "outputIndexes": [ 1851 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_2_output_0", "outputIndexes": [ 1852 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1852 ] , "main_type": "NONE", "name": "Shape2736", "outputIndexes": [ 1853 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1852 ] , "main_type": "NONE", "name": "Rank2738", "outputIndexes": [ 1854 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1854, 1854 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2740", "outputIndexes": [ 1855 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1855 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2741", "outputIndexes": [ 1856 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1855, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2743", "outputIndexes": [ 1857 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1857 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2744", "outputIndexes": [ 1858 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1853, 1856, 1858, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2747", "outputIndexes": [ 1859 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1859 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2748", "outputIndexes": [ 1860 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1860 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2749", "outputIndexes": [ 1861 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1861, 1860 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2750", "outputIndexes": [ 1862 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1852, 1862, 1855 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_2_output_0", "outputIndexes": [ 1863 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1863, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Div_output_0", "outputIndexes": [ 1864 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1864, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1865 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850, 1865, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_1_output_0", "outputIndexes": [ 1866 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1866 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.20/self_attn/Neg_output_0", "outputIndexes": [ 1867 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1864, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1868 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850, 20, 1868, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_output_0", "outputIndexes": [ 1869 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1867, 1869 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.20/self_attn/Concat_3_output_0", "outputIndexes": [ 1870 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1870, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_1_output_0", "outputIndexes": [ 1871 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1851, 1871 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Add_output_0", "outputIndexes": [ 1872 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3458 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2464451614, 2097174, 262144, 0, 0 ] } , "name": "/layers.20/self_attn/k_proj/Linear", "outputIndexes": [ 3463 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3463 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3464 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3464 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1873 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1874 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1847, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1875 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1874, 1875, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_1_output_0", "outputIndexes": [ 1876 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1873, 1876 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_1_output_0", "outputIndexes": [ 1877 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1877, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_2_output_0", "outputIndexes": [ 1878 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1877 ] , "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_3_output_0", "outputIndexes": [ 1879 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1879 ] , "main_type": "NONE", "name": "Shape2769", "outputIndexes": [ 1880 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1879 ] , "main_type": "NONE", "name": "Rank2771", "outputIndexes": [ 1881 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1881, 1881 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2773", "outputIndexes": [ 1882 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1882 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2774", "outputIndexes": [ 1883 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1882, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2776", "outputIndexes": [ 1884 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1884 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2777", "outputIndexes": [ 1885 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1880, 1883, 1885, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2780", "outputIndexes": [ 1886 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1886 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2781", "outputIndexes": [ 1887 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1887 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2782", "outputIndexes": [ 1888 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1888, 1887 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2783", "outputIndexes": [ 1889 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1879, 1889, 1882 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.20/self_attn/Gather_3_output_0", "outputIndexes": [ 1890 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1890, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Div_1_output_0", "outputIndexes": [ 1891 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1891, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1892 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1877, 1892, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_3_output_0", "outputIndexes": [ 1893 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1893 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.20/self_attn/Neg_1_output_0", "outputIndexes": [ 1894 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1891, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1895 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1877, 20, 1895, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.20/self_attn/Slice_2_output_0", "outputIndexes": [ 1896 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1894, 1896 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.20/self_attn/Concat_4_output_0", "outputIndexes": [ 1897 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1897, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Mul_3_output_0", "outputIndexes": [ 1898 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1878, 1898 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/self_attn/Add_1_output_0", "outputIndexes": [ 1899 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3458 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2466810932, 2097174, 262144, 0, 0 ] } , "name": "/layers.20/self_attn/v_proj/Linear", "outputIndexes": [ 3467 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3467 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3468 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3468 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1900 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1901 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1847, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.20/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1902 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1901, 1902, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.20/self_attn/Concat_2_output_0", "outputIndexes": [ 1903 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1900, 1903 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.20/self_attn/Reshape_2_output_0", "outputIndexes": [ 1904 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1872, 1899, 1904, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.20/self_attn/FusedAttention", "outputIndexes": [ 1905 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1905 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3469 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3469 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3470 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3470 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2469170250, 8388630, 1048576, 0, 0 ] } , "name": "/layers.20/self_attn/o_proj/Linear", "outputIndexes": [ 3471 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3471 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3472 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3472 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1906 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1826, 1906 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/Add_output_0", "outputIndexes": [ 1907 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2478607456, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.20/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1908 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1908 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3473 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3473 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3474 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3474 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2478640224, 29360150, 3670016, 0, 0 ] } , "name": "/layers.20/mlp/gate_proj/Linear", "outputIndexes": [ 3475 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3475 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3476 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3476 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1909 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1909 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.20/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1910 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3474 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2511670390, 29360150, 3670016, 0, 0 ] } , "name": "/layers.20/mlp/up_proj/Linear", "outputIndexes": [ 3479 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3479 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3480 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3480 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1911 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1910, 1911 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/mlp/Mul_output_0", "outputIndexes": [ 1912 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1912 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3481 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3481 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3482 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3482 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2544700556, 29360150, 3670016, 0, 0 ] } , "name": "/layers.20/mlp/down_proj/Linear", "outputIndexes": [ 3483 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3483 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3484 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3484 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1913 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907, 1913 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.20/Add_1_output_0", "outputIndexes": [ 1914 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1914, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/Reshape_output_0", "outputIndexes": [ 1915 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1915 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2577730722, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.21/input_layernorm/Mul_1_output_0", "outputIndexes": [ 1916 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1916 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3485 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3485 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3486 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3486 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2577763490, 8388630, 1048576, 0, 0 ] } , "name": "/layers.21/self_attn/q_proj/Linear", "outputIndexes": [ 3487 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3487 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3488 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3488 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1917 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1916 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_output_0", "outputIndexes": [ 1918 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1918 ] , "main_type": "NONE", "name": "Shape2829", "outputIndexes": [ 1919 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1918 ] , "main_type": "NONE", "name": "Rank2831", "outputIndexes": [ 1920 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1920, 1920 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2833", "outputIndexes": [ 1921 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2834", "outputIndexes": [ 1922 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2836", "outputIndexes": [ 1923 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1923 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2837", "outputIndexes": [ 1924 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1919, 1922, 1924, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2840", "outputIndexes": [ 1925 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1925 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2841", "outputIndexes": [ 1926 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1926, 1926 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2843", "outputIndexes": [ 1927 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1918, 1927, 1921 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_output_0", "outputIndexes": [ 1928 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1928, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_output_0", "outputIndexes": [ 1929 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2851", "outputIndexes": [ 1930 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1923 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2854", "outputIndexes": [ 1931 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1919, 1930, 1931, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2857", "outputIndexes": [ 1932 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1932 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2858", "outputIndexes": [ 1933 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1933 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2859", "outputIndexes": [ 1934 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1934, 1933 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2860", "outputIndexes": [ 1935 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1918, 1935, 1921 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_1_output_0", "outputIndexes": [ 1936 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1936, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 1937 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1929, 1937, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_output_0", "outputIndexes": [ 1938 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1917, 1938 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_output_0", "outputIndexes": [ 1939 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1939, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_output_0", "outputIndexes": [ 1940 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1939 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_2_output_0", "outputIndexes": [ 1941 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1941 ] , "main_type": "NONE", "name": "Shape2867", "outputIndexes": [ 1942 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1941 ] , "main_type": "NONE", "name": "Rank2869", "outputIndexes": [ 1943 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1943, 1943 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2871", "outputIndexes": [ 1944 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1944 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2872", "outputIndexes": [ 1945 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1944, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2874", "outputIndexes": [ 1946 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1946 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2875", "outputIndexes": [ 1947 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1942, 1945, 1947, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2878", "outputIndexes": [ 1948 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1948 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2879", "outputIndexes": [ 1949 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1949 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2880", "outputIndexes": [ 1950 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1950, 1949 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2881", "outputIndexes": [ 1951 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1941, 1951, 1944 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_2_output_0", "outputIndexes": [ 1952 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1952, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Div_output_0", "outputIndexes": [ 1953 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1953, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 1954 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1939, 1954, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_1_output_0", "outputIndexes": [ 1955 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1955 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.21/self_attn/Neg_output_0", "outputIndexes": [ 1956 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1953, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 1957 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1939, 20, 1957, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_output_0", "outputIndexes": [ 1958 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1956, 1958 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.21/self_attn/Concat_3_output_0", "outputIndexes": [ 1959 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1959, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_1_output_0", "outputIndexes": [ 1960 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1940, 1960 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Add_output_0", "outputIndexes": [ 1961 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3486 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2587200696, 2097174, 262144, 0, 0 ] } , "name": "/layers.21/self_attn/k_proj/Linear", "outputIndexes": [ 3491 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3491 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3492 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3492 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1962 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1928, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 1963 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1936, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 1964 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1963, 1964, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_1_output_0", "outputIndexes": [ 1965 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1962, 1965 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_1_output_0", "outputIndexes": [ 1966 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_2_output_0", "outputIndexes": [ 1967 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966 ] , "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_3_output_0", "outputIndexes": [ 1968 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1968 ] , "main_type": "NONE", "name": "Shape2900", "outputIndexes": [ 1969 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1968 ] , "main_type": "NONE", "name": "Rank2902", "outputIndexes": [ 1970 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1970, 1970 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2904", "outputIndexes": [ 1971 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2905", "outputIndexes": [ 1972 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2907", "outputIndexes": [ 1973 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1973 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2908", "outputIndexes": [ 1974 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1969, 1972, 1974, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2911", "outputIndexes": [ 1975 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1975 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2912", "outputIndexes": [ 1976 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 1976 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2913", "outputIndexes": [ 1977 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1977, 1976 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2914", "outputIndexes": [ 1978 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1968, 1978, 1971 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.21/self_attn/Gather_3_output_0", "outputIndexes": [ 1979 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1979, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Div_1_output_0", "outputIndexes": [ 1980 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1980, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 1981 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966, 1981, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_3_output_0", "outputIndexes": [ 1982 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1982 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.21/self_attn/Neg_1_output_0", "outputIndexes": [ 1983 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1980, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 1984 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966, 20, 1984, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.21/self_attn/Slice_2_output_0", "outputIndexes": [ 1985 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1983, 1985 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.21/self_attn/Concat_4_output_0", "outputIndexes": [ 1986 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1986, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Mul_3_output_0", "outputIndexes": [ 1987 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1967, 1987 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/self_attn/Add_1_output_0", "outputIndexes": [ 1988 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3486 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2589560014, 2097174, 262144, 0, 0 ] } , "name": "/layers.21/self_attn/v_proj/Linear", "outputIndexes": [ 3495 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3495 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3496 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3496 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1989 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1928, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 1990 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1936, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.21/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 1991 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1990, 1991, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.21/self_attn/Concat_2_output_0", "outputIndexes": [ 1992 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1989, 1992 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.21/self_attn/Reshape_2_output_0", "outputIndexes": [ 1993 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1961, 1988, 1993, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.21/self_attn/FusedAttention", "outputIndexes": [ 1994 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1994 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3497 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3497 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3498 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3498 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2591919332, 8388630, 1048576, 0, 0 ] } , "name": "/layers.21/self_attn/o_proj/Linear", "outputIndexes": [ 3499 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3499 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3500 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3500 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1995 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1915, 1995 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/Add_output_0", "outputIndexes": [ 1996 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1996 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2601356538, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.21/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 1997 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1997 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3501 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3501 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3502 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3502 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2601389306, 29360150, 3670016, 0, 0 ] } , "name": "/layers.21/mlp/gate_proj/Linear", "outputIndexes": [ 3503 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3503 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3504 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3504 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1998 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1998 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.21/mlp/act_fn/Mul_output_0", "outputIndexes": [ 1999 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3502 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2634419472, 29360150, 3670016, 0, 0 ] } , "name": "/layers.21/mlp/up_proj/Linear", "outputIndexes": [ 3507 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3507 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3508 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3508 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2000 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1999, 2000 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/mlp/Mul_output_0", "outputIndexes": [ 2001 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2001 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3509 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3509 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3510 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3510 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2667449638, 29360150, 3670016, 0, 0 ] } , "name": "/layers.21/mlp/down_proj/Linear", "outputIndexes": [ 3511 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3511 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3512 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3512 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2002 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1996, 2002 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.21/Add_1_output_0", "outputIndexes": [ 2003 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2003, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/Reshape_output_0", "outputIndexes": [ 2004 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2004 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2700479804, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.22/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2005 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2005 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3513 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3513 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3514 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3514 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2700512572, 8388630, 1048576, 0, 0 ] } , "name": "/layers.22/self_attn/q_proj/Linear", "outputIndexes": [ 3515 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3515 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3516 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3516 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2006 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2005 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_output_0", "outputIndexes": [ 2007 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2007 ] , "main_type": "NONE", "name": "Shape2960", "outputIndexes": [ 2008 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2007 ] , "main_type": "NONE", "name": "Rank2962", "outputIndexes": [ 2009 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2009, 2009 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2964", "outputIndexes": [ 2010 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2010 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2965", "outputIndexes": [ 2011 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2010, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2967", "outputIndexes": [ 2012 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2012 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2968", "outputIndexes": [ 2013 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2008, 2011, 2013, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2971", "outputIndexes": [ 2014 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2014 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2972", "outputIndexes": [ 2015 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2015, 2015 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2974", "outputIndexes": [ 2016 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2007, 2016, 2010 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_output_0", "outputIndexes": [ 2017 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2017, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2018 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2010 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2982", "outputIndexes": [ 2019 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2012 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2985", "outputIndexes": [ 2020 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2008, 2019, 2020, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2988", "outputIndexes": [ 2021 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2021 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2989", "outputIndexes": [ 2022 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2022 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2990", "outputIndexes": [ 2023 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2023, 2022 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2991", "outputIndexes": [ 2024 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2007, 2024, 2010 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_1_output_0", "outputIndexes": [ 2025 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2026 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2018, 2026, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_output_0", "outputIndexes": [ 2027 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2006, 2027 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_output_0", "outputIndexes": [ 2028 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2028, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_output_0", "outputIndexes": [ 2029 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2028 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_2_output_0", "outputIndexes": [ 2030 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2030 ] , "main_type": "NONE", "name": "Shape2998", "outputIndexes": [ 2031 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2030 ] , "main_type": "NONE", "name": "Rank3000", "outputIndexes": [ 2032 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2032, 2032 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3002", "outputIndexes": [ 2033 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2033 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3003", "outputIndexes": [ 2034 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2033, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3005", "outputIndexes": [ 2035 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2035 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3006", "outputIndexes": [ 2036 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2031, 2034, 2036, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3009", "outputIndexes": [ 2037 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2037 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3010", "outputIndexes": [ 2038 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2038 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3011", "outputIndexes": [ 2039 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2039, 2038 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3012", "outputIndexes": [ 2040 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2030, 2040, 2033 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_2_output_0", "outputIndexes": [ 2041 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2041, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Div_output_0", "outputIndexes": [ 2042 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2042, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2043 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2028, 2043, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_1_output_0", "outputIndexes": [ 2044 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2044 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.22/self_attn/Neg_output_0", "outputIndexes": [ 2045 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2042, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2046 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2028, 20, 2046, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_output_0", "outputIndexes": [ 2047 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2045, 2047 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.22/self_attn/Concat_3_output_0", "outputIndexes": [ 2048 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2048, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_1_output_0", "outputIndexes": [ 2049 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2029, 2049 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Add_output_0", "outputIndexes": [ 2050 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3514 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2709949778, 2097174, 262144, 0, 0 ] } , "name": "/layers.22/self_attn/k_proj/Linear", "outputIndexes": [ 3519 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3519 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3520 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3520 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2051 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2017, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2052 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2053 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2052, 2053, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_1_output_0", "outputIndexes": [ 2054 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2051, 2054 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_1_output_0", "outputIndexes": [ 2055 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_2_output_0", "outputIndexes": [ 2056 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055 ] , "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_3_output_0", "outputIndexes": [ 2057 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2057 ] , "main_type": "NONE", "name": "Shape3031", "outputIndexes": [ 2058 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2057 ] , "main_type": "NONE", "name": "Rank3033", "outputIndexes": [ 2059 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2059, 2059 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3035", "outputIndexes": [ 2060 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2060 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3036", "outputIndexes": [ 2061 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2060, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3038", "outputIndexes": [ 2062 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2062 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3039", "outputIndexes": [ 2063 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2058, 2061, 2063, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3042", "outputIndexes": [ 2064 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2064 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3043", "outputIndexes": [ 2065 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2065 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3044", "outputIndexes": [ 2066 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2066, 2065 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3045", "outputIndexes": [ 2067 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057, 2067, 2060 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.22/self_attn/Gather_3_output_0", "outputIndexes": [ 2068 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2068, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Div_1_output_0", "outputIndexes": [ 2069 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2069, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2070 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055, 2070, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_3_output_0", "outputIndexes": [ 2071 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2071 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.22/self_attn/Neg_1_output_0", "outputIndexes": [ 2072 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2069, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2073 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055, 20, 2073, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.22/self_attn/Slice_2_output_0", "outputIndexes": [ 2074 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2072, 2074 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.22/self_attn/Concat_4_output_0", "outputIndexes": [ 2075 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2075, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Mul_3_output_0", "outputIndexes": [ 2076 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2056, 2076 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/self_attn/Add_1_output_0", "outputIndexes": [ 2077 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3514 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2712309096, 2097174, 262144, 0, 0 ] } , "name": "/layers.22/self_attn/v_proj/Linear", "outputIndexes": [ 3523 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3523 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3524 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3524 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2078 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2017, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2079 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.22/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2080 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2079, 2080, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.22/self_attn/Concat_2_output_0", "outputIndexes": [ 2081 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2078, 2081 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.22/self_attn/Reshape_2_output_0", "outputIndexes": [ 2082 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2050, 2077, 2082, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.22/self_attn/FusedAttention", "outputIndexes": [ 2083 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2083 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3525 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3525 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3526 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3526 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2714668414, 8388630, 1048576, 0, 0 ] } , "name": "/layers.22/self_attn/o_proj/Linear", "outputIndexes": [ 3527 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3527 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3528 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3528 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2084 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2004, 2084 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/Add_output_0", "outputIndexes": [ 2085 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2085 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2724105620, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.22/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2086 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2086 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3529 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3529 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3530 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3530 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2724138388, 29360150, 3670016, 0, 0 ] } , "name": "/layers.22/mlp/gate_proj/Linear", "outputIndexes": [ 3531 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3531 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3532 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3532 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2087 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2087 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.22/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2088 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3530 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2757168554, 29360150, 3670016, 0, 0 ] } , "name": "/layers.22/mlp/up_proj/Linear", "outputIndexes": [ 3535 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3535 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3536 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3536 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2089 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2088, 2089 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/mlp/Mul_output_0", "outputIndexes": [ 2090 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2090 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3537 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3537 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3538 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3538 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2790198720, 29360150, 3670016, 0, 0 ] } , "name": "/layers.22/mlp/down_proj/Linear", "outputIndexes": [ 3539 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3539 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3540 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3540 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2091 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2085, 2091 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.22/Add_1_output_0", "outputIndexes": [ 2092 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2092, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/Reshape_output_0", "outputIndexes": [ 2093 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2093 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2823228886, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.23/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2094 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2094 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3541 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3541 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3542 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3542 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2823261654, 8388630, 1048576, 0, 0 ] } , "name": "/layers.23/self_attn/q_proj/Linear", "outputIndexes": [ 3543 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3543 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3544 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3544 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2095 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2094 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_output_0", "outputIndexes": [ 2096 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2096 ] , "main_type": "NONE", "name": "Shape3091", "outputIndexes": [ 2097 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2096 ] , "main_type": "NONE", "name": "Rank3093", "outputIndexes": [ 2098 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2098, 2098 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3095", "outputIndexes": [ 2099 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2099 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3096", "outputIndexes": [ 2100 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2099, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3098", "outputIndexes": [ 2101 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2101 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3099", "outputIndexes": [ 2102 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2097, 2100, 2102, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3102", "outputIndexes": [ 2103 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2103 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3103", "outputIndexes": [ 2104 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2104, 2104 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3105", "outputIndexes": [ 2105 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2096, 2105, 2099 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_output_0", "outputIndexes": [ 2106 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2106, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2107 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2099 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3113", "outputIndexes": [ 2108 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2101 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3116", "outputIndexes": [ 2109 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2097, 2108, 2109, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3119", "outputIndexes": [ 2110 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2110 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3120", "outputIndexes": [ 2111 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2111 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3121", "outputIndexes": [ 2112 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2112, 2111 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3122", "outputIndexes": [ 2113 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2096, 2113, 2099 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_1_output_0", "outputIndexes": [ 2114 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2114, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2115 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2107, 2115, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_output_0", "outputIndexes": [ 2116 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2095, 2116 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_output_0", "outputIndexes": [ 2117 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2117, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_output_0", "outputIndexes": [ 2118 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2117 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_2_output_0", "outputIndexes": [ 2119 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2119 ] , "main_type": "NONE", "name": "Shape3129", "outputIndexes": [ 2120 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2119 ] , "main_type": "NONE", "name": "Rank3131", "outputIndexes": [ 2121 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2121, 2121 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3133", "outputIndexes": [ 2122 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2122 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3134", "outputIndexes": [ 2123 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2122, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3136", "outputIndexes": [ 2124 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2124 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3137", "outputIndexes": [ 2125 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2120, 2123, 2125, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3140", "outputIndexes": [ 2126 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2126 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3141", "outputIndexes": [ 2127 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2127 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3142", "outputIndexes": [ 2128 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2128, 2127 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3143", "outputIndexes": [ 2129 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119, 2129, 2122 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_2_output_0", "outputIndexes": [ 2130 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2130, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Div_output_0", "outputIndexes": [ 2131 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2131, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2132 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2117, 2132, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_1_output_0", "outputIndexes": [ 2133 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2133 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.23/self_attn/Neg_output_0", "outputIndexes": [ 2134 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2131, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2135 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2117, 20, 2135, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_output_0", "outputIndexes": [ 2136 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2134, 2136 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.23/self_attn/Concat_3_output_0", "outputIndexes": [ 2137 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2137, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_1_output_0", "outputIndexes": [ 2138 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2118, 2138 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Add_output_0", "outputIndexes": [ 2139 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3542 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2832698860, 2097174, 262144, 0, 0 ] } , "name": "/layers.23/self_attn/k_proj/Linear", "outputIndexes": [ 3547 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3547 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3548 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3548 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2140 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2106, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2141 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2114, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2142 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2141, 2142, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_1_output_0", "outputIndexes": [ 2143 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2140, 2143 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_1_output_0", "outputIndexes": [ 2144 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2144, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_2_output_0", "outputIndexes": [ 2145 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2144 ] , "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_3_output_0", "outputIndexes": [ 2146 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2146 ] , "main_type": "NONE", "name": "Shape3162", "outputIndexes": [ 2147 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2146 ] , "main_type": "NONE", "name": "Rank3164", "outputIndexes": [ 2148 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2148, 2148 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3166", "outputIndexes": [ 2149 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2149 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3167", "outputIndexes": [ 2150 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2149, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3169", "outputIndexes": [ 2151 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2151 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3170", "outputIndexes": [ 2152 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2147, 2150, 2152, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3173", "outputIndexes": [ 2153 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2153 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3174", "outputIndexes": [ 2154 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2154 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3175", "outputIndexes": [ 2155 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2155, 2154 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3176", "outputIndexes": [ 2156 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2146, 2156, 2149 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.23/self_attn/Gather_3_output_0", "outputIndexes": [ 2157 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2157, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Div_1_output_0", "outputIndexes": [ 2158 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2158, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2159 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2144, 2159, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_3_output_0", "outputIndexes": [ 2160 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2160 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.23/self_attn/Neg_1_output_0", "outputIndexes": [ 2161 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2158, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2162 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2144, 20, 2162, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.23/self_attn/Slice_2_output_0", "outputIndexes": [ 2163 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2161, 2163 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.23/self_attn/Concat_4_output_0", "outputIndexes": [ 2164 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2164, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Mul_3_output_0", "outputIndexes": [ 2165 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2145, 2165 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/self_attn/Add_1_output_0", "outputIndexes": [ 2166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3542 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2835058178, 2097174, 262144, 0, 0 ] } , "name": "/layers.23/self_attn/v_proj/Linear", "outputIndexes": [ 3551 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3551 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3552 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3552 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2167 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2106, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2168 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2114, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.23/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2169 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2168, 2169, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.23/self_attn/Concat_2_output_0", "outputIndexes": [ 2170 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2167, 2170 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.23/self_attn/Reshape_2_output_0", "outputIndexes": [ 2171 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2139, 2166, 2171, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.23/self_attn/FusedAttention", "outputIndexes": [ 2172 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2172 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3553 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3553 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3554 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3554 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2837417496, 8388630, 1048576, 0, 0 ] } , "name": "/layers.23/self_attn/o_proj/Linear", "outputIndexes": [ 3555 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3555 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3556 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3556 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2173 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2093, 2173 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/Add_output_0", "outputIndexes": [ 2174 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2174 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2846854702, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.23/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2175 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2175 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3557 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3557 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3558 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3558 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2846887470, 29360150, 3670016, 0, 0 ] } , "name": "/layers.23/mlp/gate_proj/Linear", "outputIndexes": [ 3559 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3559 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3560 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3560 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2176 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2176 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.23/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2177 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3558 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2879917636, 29360150, 3670016, 0, 0 ] } , "name": "/layers.23/mlp/up_proj/Linear", "outputIndexes": [ 3563 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3563 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3564 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3564 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2178 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2177, 2178 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/mlp/Mul_output_0", "outputIndexes": [ 2179 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2179 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3565 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3565 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3566 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3566 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2912947802, 29360150, 3670016, 0, 0 ] } , "name": "/layers.23/mlp/down_proj/Linear", "outputIndexes": [ 3567 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3567 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3568 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3568 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2180 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2174, 2180 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.23/Add_1_output_0", "outputIndexes": [ 2181 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2181, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/Reshape_output_0", "outputIndexes": [ 2182 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2182 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2945977968, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.24/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2183 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2183 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3569 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3569 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3570 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3570 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2946010736, 8388630, 1048576, 0, 0 ] } , "name": "/layers.24/self_attn/q_proj/Linear", "outputIndexes": [ 3571 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3571 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3572 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3572 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2184 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2183 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_output_0", "outputIndexes": [ 2185 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2185 ] , "main_type": "NONE", "name": "Shape3222", "outputIndexes": [ 2186 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2185 ] , "main_type": "NONE", "name": "Rank3224", "outputIndexes": [ 2187 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2187, 2187 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3226", "outputIndexes": [ 2188 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2188 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3227", "outputIndexes": [ 2189 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2188, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3229", "outputIndexes": [ 2190 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2190 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3230", "outputIndexes": [ 2191 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2186, 2189, 2191, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3233", "outputIndexes": [ 2192 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2192 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3234", "outputIndexes": [ 2193 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2193, 2193 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3236", "outputIndexes": [ 2194 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2185, 2194, 2188 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_output_0", "outputIndexes": [ 2195 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2195, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2196 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2188 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3244", "outputIndexes": [ 2197 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2190 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3247", "outputIndexes": [ 2198 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2186, 2197, 2198, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3250", "outputIndexes": [ 2199 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2199 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3251", "outputIndexes": [ 2200 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2200 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3252", "outputIndexes": [ 2201 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2201, 2200 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3253", "outputIndexes": [ 2202 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2185, 2202, 2188 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_1_output_0", "outputIndexes": [ 2203 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2203, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2204 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2196, 2204, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_output_0", "outputIndexes": [ 2205 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2184, 2205 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_output_0", "outputIndexes": [ 2206 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_output_0", "outputIndexes": [ 2207 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_2_output_0", "outputIndexes": [ 2208 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2208 ] , "main_type": "NONE", "name": "Shape3260", "outputIndexes": [ 2209 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2208 ] , "main_type": "NONE", "name": "Rank3262", "outputIndexes": [ 2210 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2210, 2210 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3264", "outputIndexes": [ 2211 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2211 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3265", "outputIndexes": [ 2212 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2211, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3267", "outputIndexes": [ 2213 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2213 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3268", "outputIndexes": [ 2214 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2209, 2212, 2214, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3271", "outputIndexes": [ 2215 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2215 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3272", "outputIndexes": [ 2216 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2216 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3273", "outputIndexes": [ 2217 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2217, 2216 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3274", "outputIndexes": [ 2218 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2208, 2218, 2211 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_2_output_0", "outputIndexes": [ 2219 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2219, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Div_output_0", "outputIndexes": [ 2220 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2220, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2221 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206, 2221, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_1_output_0", "outputIndexes": [ 2222 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2222 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.24/self_attn/Neg_output_0", "outputIndexes": [ 2223 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2220, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2224 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206, 20, 2224, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_output_0", "outputIndexes": [ 2225 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2223, 2225 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.24/self_attn/Concat_3_output_0", "outputIndexes": [ 2226 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2226, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_1_output_0", "outputIndexes": [ 2227 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2207, 2227 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Add_output_0", "outputIndexes": [ 2228 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3570 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2955447942, 2097174, 262144, 0, 0 ] } , "name": "/layers.24/self_attn/k_proj/Linear", "outputIndexes": [ 3575 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3575 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3576 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3576 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2229 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2195, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2230 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2203, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2231 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2230, 2231, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_1_output_0", "outputIndexes": [ 2232 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2229, 2232 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_1_output_0", "outputIndexes": [ 2233 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2233, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_2_output_0", "outputIndexes": [ 2234 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2233 ] , "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_3_output_0", "outputIndexes": [ 2235 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2235 ] , "main_type": "NONE", "name": "Shape3293", "outputIndexes": [ 2236 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2235 ] , "main_type": "NONE", "name": "Rank3295", "outputIndexes": [ 2237 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2237, 2237 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3297", "outputIndexes": [ 2238 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2238 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3298", "outputIndexes": [ 2239 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2238, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3300", "outputIndexes": [ 2240 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2240 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3301", "outputIndexes": [ 2241 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2236, 2239, 2241, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3304", "outputIndexes": [ 2242 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2242 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3305", "outputIndexes": [ 2243 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2243 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3306", "outputIndexes": [ 2244 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2244, 2243 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3307", "outputIndexes": [ 2245 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2235, 2245, 2238 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.24/self_attn/Gather_3_output_0", "outputIndexes": [ 2246 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2246, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Div_1_output_0", "outputIndexes": [ 2247 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2247, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2248 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2233, 2248, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_3_output_0", "outputIndexes": [ 2249 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2249 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.24/self_attn/Neg_1_output_0", "outputIndexes": [ 2250 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2247, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2251 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2233, 20, 2251, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.24/self_attn/Slice_2_output_0", "outputIndexes": [ 2252 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2250, 2252 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.24/self_attn/Concat_4_output_0", "outputIndexes": [ 2253 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2253, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Mul_3_output_0", "outputIndexes": [ 2254 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2234, 2254 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/self_attn/Add_1_output_0", "outputIndexes": [ 2255 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3570 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2957807260, 2097174, 262144, 0, 0 ] } , "name": "/layers.24/self_attn/v_proj/Linear", "outputIndexes": [ 3579 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3579 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3580 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3580 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2256 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2195, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2257 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2203, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.24/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2258 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2257, 2258, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.24/self_attn/Concat_2_output_0", "outputIndexes": [ 2259 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2256, 2259 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.24/self_attn/Reshape_2_output_0", "outputIndexes": [ 2260 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2228, 2255, 2260, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.24/self_attn/FusedAttention", "outputIndexes": [ 2261 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2261 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3581 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3581 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3582 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3582 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2960166578, 8388630, 1048576, 0, 0 ] } , "name": "/layers.24/self_attn/o_proj/Linear", "outputIndexes": [ 3583 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3583 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3584 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3584 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2262 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2182, 2262 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/Add_output_0", "outputIndexes": [ 2263 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2263 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 2969603784, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.24/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2264 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2264 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3585 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3585 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3586 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3586 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2969636552, 29360150, 3670016, 0, 0 ] } , "name": "/layers.24/mlp/gate_proj/Linear", "outputIndexes": [ 3587 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3587 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3588 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3588 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2265 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2265 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.24/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2266 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3586 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3002666718, 29360150, 3670016, 0, 0 ] } , "name": "/layers.24/mlp/up_proj/Linear", "outputIndexes": [ 3591 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3591 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3592 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3592 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2267 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2266, 2267 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/mlp/Mul_output_0", "outputIndexes": [ 2268 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2268 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3593 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3593 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3594 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3594 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3035696884, 29360150, 3670016, 0, 0 ] } , "name": "/layers.24/mlp/down_proj/Linear", "outputIndexes": [ 3595 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3595 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3596 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3596 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2269 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2263, 2269 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.24/Add_1_output_0", "outputIndexes": [ 2270 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2270, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/Reshape_output_0", "outputIndexes": [ 2271 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2271 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3068727050, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.25/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2272 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2272 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3597 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3597 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3598 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3598 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3068759818, 8388630, 1048576, 0, 0 ] } , "name": "/layers.25/self_attn/q_proj/Linear", "outputIndexes": [ 3599 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3599 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3600 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3600 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2273 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2272 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_output_0", "outputIndexes": [ 2274 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2274 ] , "main_type": "NONE", "name": "Shape3353", "outputIndexes": [ 2275 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2274 ] , "main_type": "NONE", "name": "Rank3355", "outputIndexes": [ 2276 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2276, 2276 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3357", "outputIndexes": [ 2277 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2277 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3358", "outputIndexes": [ 2278 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2277, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3360", "outputIndexes": [ 2279 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2279 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3361", "outputIndexes": [ 2280 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2275, 2278, 2280, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3364", "outputIndexes": [ 2281 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2281 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3365", "outputIndexes": [ 2282 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2282, 2282 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3367", "outputIndexes": [ 2283 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2274, 2283, 2277 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_output_0", "outputIndexes": [ 2284 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2285 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2277 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3375", "outputIndexes": [ 2286 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2279 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3378", "outputIndexes": [ 2287 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2275, 2286, 2287, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3381", "outputIndexes": [ 2288 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2288 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3382", "outputIndexes": [ 2289 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2289 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3383", "outputIndexes": [ 2290 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2290, 2289 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3384", "outputIndexes": [ 2291 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2274, 2291, 2277 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_1_output_0", "outputIndexes": [ 2292 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2292, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2293 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2285, 2293, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_output_0", "outputIndexes": [ 2294 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2273, 2294 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_output_0", "outputIndexes": [ 2295 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2295, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_output_0", "outputIndexes": [ 2296 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2295 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_2_output_0", "outputIndexes": [ 2297 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2297 ] , "main_type": "NONE", "name": "Shape3391", "outputIndexes": [ 2298 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2297 ] , "main_type": "NONE", "name": "Rank3393", "outputIndexes": [ 2299 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299, 2299 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3395", "outputIndexes": [ 2300 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2300 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3396", "outputIndexes": [ 2301 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2300, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3398", "outputIndexes": [ 2302 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2302 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3399", "outputIndexes": [ 2303 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2298, 2301, 2303, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3402", "outputIndexes": [ 2304 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2304 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3403", "outputIndexes": [ 2305 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2305 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3404", "outputIndexes": [ 2306 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2306, 2305 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3405", "outputIndexes": [ 2307 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2297, 2307, 2300 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_2_output_0", "outputIndexes": [ 2308 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2308, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Div_output_0", "outputIndexes": [ 2309 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2309, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2310 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2295, 2310, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_1_output_0", "outputIndexes": [ 2311 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2311 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.25/self_attn/Neg_output_0", "outputIndexes": [ 2312 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2309, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2313 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2295, 20, 2313, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_output_0", "outputIndexes": [ 2314 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2312, 2314 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.25/self_attn/Concat_3_output_0", "outputIndexes": [ 2315 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2315, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_1_output_0", "outputIndexes": [ 2316 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2296, 2316 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Add_output_0", "outputIndexes": [ 2317 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3598 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3078197024, 2097174, 262144, 0, 0 ] } , "name": "/layers.25/self_attn/k_proj/Linear", "outputIndexes": [ 3603 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3603 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3604 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3604 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2318 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2319 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2292, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2320 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2319, 2320, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_1_output_0", "outputIndexes": [ 2321 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2318, 2321 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_1_output_0", "outputIndexes": [ 2322 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2322, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_2_output_0", "outputIndexes": [ 2323 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2322 ] , "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_3_output_0", "outputIndexes": [ 2324 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2324 ] , "main_type": "NONE", "name": "Shape3424", "outputIndexes": [ 2325 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2324 ] , "main_type": "NONE", "name": "Rank3426", "outputIndexes": [ 2326 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2326, 2326 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3428", "outputIndexes": [ 2327 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2327 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3429", "outputIndexes": [ 2328 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2327, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3431", "outputIndexes": [ 2329 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2329 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3432", "outputIndexes": [ 2330 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2325, 2328, 2330, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3435", "outputIndexes": [ 2331 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2331 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3436", "outputIndexes": [ 2332 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2332 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3437", "outputIndexes": [ 2333 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2333, 2332 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3438", "outputIndexes": [ 2334 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2324, 2334, 2327 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.25/self_attn/Gather_3_output_0", "outputIndexes": [ 2335 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2335, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Div_1_output_0", "outputIndexes": [ 2336 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2336, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2337 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2322, 2337, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_3_output_0", "outputIndexes": [ 2338 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2338 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.25/self_attn/Neg_1_output_0", "outputIndexes": [ 2339 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2336, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2340 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2322, 20, 2340, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.25/self_attn/Slice_2_output_0", "outputIndexes": [ 2341 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2339, 2341 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.25/self_attn/Concat_4_output_0", "outputIndexes": [ 2342 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2342, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Mul_3_output_0", "outputIndexes": [ 2343 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2323, 2343 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/self_attn/Add_1_output_0", "outputIndexes": [ 2344 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3598 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3080556342, 2097174, 262144, 0, 0 ] } , "name": "/layers.25/self_attn/v_proj/Linear", "outputIndexes": [ 3607 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3607 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3608 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3608 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2345 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2346 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2292, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.25/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2347 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2346, 2347, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.25/self_attn/Concat_2_output_0", "outputIndexes": [ 2348 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2345, 2348 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.25/self_attn/Reshape_2_output_0", "outputIndexes": [ 2349 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2317, 2344, 2349, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.25/self_attn/FusedAttention", "outputIndexes": [ 2350 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2350 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3609 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3609 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3610 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3610 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3082915660, 8388630, 1048576, 0, 0 ] } , "name": "/layers.25/self_attn/o_proj/Linear", "outputIndexes": [ 3611 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3611 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3612 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3612 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2351 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2271, 2351 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/Add_output_0", "outputIndexes": [ 2352 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2352 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3092352866, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.25/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2353 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2353 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3613 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3613 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3614 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3614 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3092385634, 29360150, 3670016, 0, 0 ] } , "name": "/layers.25/mlp/gate_proj/Linear", "outputIndexes": [ 3615 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3615 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3616 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3616 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2354 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2354 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.25/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2355 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3614 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3125415800, 29360150, 3670016, 0, 0 ] } , "name": "/layers.25/mlp/up_proj/Linear", "outputIndexes": [ 3619 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3619 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3620 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3620 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2356 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2355, 2356 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/mlp/Mul_output_0", "outputIndexes": [ 2357 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2357 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3621 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3621 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3622 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3622 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3158445966, 29360150, 3670016, 0, 0 ] } , "name": "/layers.25/mlp/down_proj/Linear", "outputIndexes": [ 3623 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3623 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3624 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3624 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2358 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2352, 2358 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.25/Add_1_output_0", "outputIndexes": [ 2359 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2359, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/Reshape_output_0", "outputIndexes": [ 2360 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2360 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3191476132, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.26/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2361 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2361 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3625 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3625 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3626 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3626 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3191508900, 8388630, 1048576, 0, 0 ] } , "name": "/layers.26/self_attn/q_proj/Linear", "outputIndexes": [ 3627 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3627 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3628 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3628 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2362 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2361 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_output_0", "outputIndexes": [ 2363 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2363 ] , "main_type": "NONE", "name": "Shape3484", "outputIndexes": [ 2364 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2363 ] , "main_type": "NONE", "name": "Rank3486", "outputIndexes": [ 2365 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2365, 2365 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3488", "outputIndexes": [ 2366 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2366 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3489", "outputIndexes": [ 2367 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2366, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3491", "outputIndexes": [ 2368 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2368 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3492", "outputIndexes": [ 2369 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2364, 2367, 2369, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3495", "outputIndexes": [ 2370 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2370 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3496", "outputIndexes": [ 2371 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2371, 2371 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3498", "outputIndexes": [ 2372 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363, 2372, 2366 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_output_0", "outputIndexes": [ 2373 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2373, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2374 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2366 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3506", "outputIndexes": [ 2375 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2368 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3509", "outputIndexes": [ 2376 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2364, 2375, 2376, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3512", "outputIndexes": [ 2377 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2377 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3513", "outputIndexes": [ 2378 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2378 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3514", "outputIndexes": [ 2379 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2379, 2378 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3515", "outputIndexes": [ 2380 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363, 2380, 2366 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_1_output_0", "outputIndexes": [ 2381 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2381, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2382 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2374, 2382, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_output_0", "outputIndexes": [ 2383 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2362, 2383 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_output_0", "outputIndexes": [ 2384 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2384, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_output_0", "outputIndexes": [ 2385 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2384 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_2_output_0", "outputIndexes": [ 2386 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2386 ] , "main_type": "NONE", "name": "Shape3522", "outputIndexes": [ 2387 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2386 ] , "main_type": "NONE", "name": "Rank3524", "outputIndexes": [ 2388 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2388, 2388 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3526", "outputIndexes": [ 2389 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2389 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3527", "outputIndexes": [ 2390 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2389, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3529", "outputIndexes": [ 2391 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2391 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3530", "outputIndexes": [ 2392 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2387, 2390, 2392, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3533", "outputIndexes": [ 2393 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2393 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3534", "outputIndexes": [ 2394 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2394 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3535", "outputIndexes": [ 2395 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2395, 2394 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3536", "outputIndexes": [ 2396 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2386, 2396, 2389 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_2_output_0", "outputIndexes": [ 2397 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2397, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Div_output_0", "outputIndexes": [ 2398 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2398, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2399 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2384, 2399, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_1_output_0", "outputIndexes": [ 2400 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2400 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.26/self_attn/Neg_output_0", "outputIndexes": [ 2401 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2398, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2402 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2384, 20, 2402, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_output_0", "outputIndexes": [ 2403 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2401, 2403 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.26/self_attn/Concat_3_output_0", "outputIndexes": [ 2404 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2404, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_1_output_0", "outputIndexes": [ 2405 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2385, 2405 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Add_output_0", "outputIndexes": [ 2406 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3626 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3200946106, 2097174, 262144, 0, 0 ] } , "name": "/layers.26/self_attn/k_proj/Linear", "outputIndexes": [ 3631 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3631 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3632 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3632 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2407 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2373, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2408 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2381, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2409 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2408, 2409, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_1_output_0", "outputIndexes": [ 2410 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2407, 2410 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_1_output_0", "outputIndexes": [ 2411 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2411, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_2_output_0", "outputIndexes": [ 2412 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2411 ] , "main_type": "NONE", "name": "/blocks.26/self_attn/Shape_3_output_0", "outputIndexes": [ 2413 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2413 ] , "main_type": "NONE", "name": "Shape3555", "outputIndexes": [ 2414 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2413 ] , "main_type": "NONE", "name": "Rank3557", "outputIndexes": [ 2415 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2415, 2415 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3559", "outputIndexes": [ 2416 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2416 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3560", "outputIndexes": [ 2417 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2416, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3562", "outputIndexes": [ 2418 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2418 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3563", "outputIndexes": [ 2419 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2414, 2417, 2419, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3566", "outputIndexes": [ 2420 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2420 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3567", "outputIndexes": [ 2421 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2421 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3568", "outputIndexes": [ 2422 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2422, 2421 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3569", "outputIndexes": [ 2423 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2413, 2423, 2416 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.26/self_attn/Gather_3_output_0", "outputIndexes": [ 2424 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2424, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Div_1_output_0", "outputIndexes": [ 2425 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2425, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2426 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2411, 2426, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_3_output_0", "outputIndexes": [ 2427 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2427 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.26/self_attn/Neg_1_output_0", "outputIndexes": [ 2428 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2425, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2429 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2411, 20, 2429, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.26/self_attn/Slice_2_output_0", "outputIndexes": [ 2430 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2428, 2430 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.26/self_attn/Concat_4_output_0", "outputIndexes": [ 2431 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2431, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Mul_3_output_0", "outputIndexes": [ 2432 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2412, 2432 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/self_attn/Add_1_output_0", "outputIndexes": [ 2433 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3626 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3203305424, 2097174, 262144, 0, 0 ] } , "name": "/layers.26/self_attn/v_proj/Linear", "outputIndexes": [ 3635 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3635 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3636 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3636 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2434 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2373, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2435 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2381, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.26/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2436 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2435, 2436, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.26/self_attn/Concat_2_output_0", "outputIndexes": [ 2437 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2434, 2437 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.26/self_attn/Reshape_2_output_0", "outputIndexes": [ 2438 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2406, 2433, 2438, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.26/self_attn/FusedAttention", "outputIndexes": [ 2439 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2439 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3637 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3637 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3638 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3638 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3205664742, 8388630, 1048576, 0, 0 ] } , "name": "/layers.26/self_attn/o_proj/Linear", "outputIndexes": [ 3639 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3639 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3640 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3640 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2440 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2360, 2440 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/Add_output_0", "outputIndexes": [ 2441 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2441 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3215101948, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.26/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2442 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2442 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3641 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3641 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3642 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3642 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3215134716, 29360150, 3670016, 0, 0 ] } , "name": "/layers.26/mlp/gate_proj/Linear", "outputIndexes": [ 3643 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3643 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3644 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3644 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2443 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2443 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.26/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2444 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3642 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3248164882, 29360150, 3670016, 0, 0 ] } , "name": "/layers.26/mlp/up_proj/Linear", "outputIndexes": [ 3647 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3647 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3648 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3648 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2445 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2444, 2445 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/mlp/Mul_output_0", "outputIndexes": [ 2446 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2446 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3649 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3649 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3650 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3650 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3281195048, 29360150, 3670016, 0, 0 ] } , "name": "/layers.26/mlp/down_proj/Linear", "outputIndexes": [ 3651 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3651 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3652 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3652 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2447 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2441, 2447 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.26/Add_1_output_0", "outputIndexes": [ 2448 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2448, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/Reshape_output_0", "outputIndexes": [ 2449 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2449 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3314225214, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.27/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2450 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2450 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3653 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3653 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3654 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3654 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3314257982, 8388630, 1048576, 0, 0 ] } , "name": "/layers.27/self_attn/q_proj/Linear", "outputIndexes": [ 3655 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3655 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3656 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3656 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2451 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2450 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_output_0", "outputIndexes": [ 2452 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2452 ] , "main_type": "NONE", "name": "Shape3615", "outputIndexes": [ 2453 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2452 ] , "main_type": "NONE", "name": "Rank3617", "outputIndexes": [ 2454 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2454, 2454 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3619", "outputIndexes": [ 2455 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2455 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3620", "outputIndexes": [ 2456 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2455, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3622", "outputIndexes": [ 2457 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2457 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3623", "outputIndexes": [ 2458 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2453, 2456, 2458, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3626", "outputIndexes": [ 2459 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2459 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3627", "outputIndexes": [ 2460 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2460, 2460 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3629", "outputIndexes": [ 2461 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2452, 2461, 2455 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_output_0", "outputIndexes": [ 2462 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2462, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2463 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2455 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3637", "outputIndexes": [ 2464 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2457 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3640", "outputIndexes": [ 2465 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2453, 2464, 2465, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3643", "outputIndexes": [ 2466 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2466 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3644", "outputIndexes": [ 2467 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2467 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3645", "outputIndexes": [ 2468 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2468, 2467 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3646", "outputIndexes": [ 2469 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2452, 2469, 2455 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_1_output_0", "outputIndexes": [ 2470 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2470, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2471 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2463, 2471, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_output_0", "outputIndexes": [ 2472 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2451, 2472 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_output_0", "outputIndexes": [ 2473 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2473, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_output_0", "outputIndexes": [ 2474 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2473 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_2_output_0", "outputIndexes": [ 2475 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2475 ] , "main_type": "NONE", "name": "Shape3653", "outputIndexes": [ 2476 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2475 ] , "main_type": "NONE", "name": "Rank3655", "outputIndexes": [ 2477 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2477, 2477 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3657", "outputIndexes": [ 2478 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2478 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3658", "outputIndexes": [ 2479 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2478, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3660", "outputIndexes": [ 2480 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2480 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3661", "outputIndexes": [ 2481 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2476, 2479, 2481, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3664", "outputIndexes": [ 2482 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2482 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3665", "outputIndexes": [ 2483 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2483 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3666", "outputIndexes": [ 2484 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2484, 2483 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3667", "outputIndexes": [ 2485 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2475, 2485, 2478 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_2_output_0", "outputIndexes": [ 2486 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2486, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Div_output_0", "outputIndexes": [ 2487 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2487, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2488 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2473, 2488, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_1_output_0", "outputIndexes": [ 2489 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2489 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.27/self_attn/Neg_output_0", "outputIndexes": [ 2490 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2487, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2491 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2473, 20, 2491, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_output_0", "outputIndexes": [ 2492 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2490, 2492 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.27/self_attn/Concat_3_output_0", "outputIndexes": [ 2493 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2493, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_1_output_0", "outputIndexes": [ 2494 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2474, 2494 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Add_output_0", "outputIndexes": [ 2495 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3654 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3323695188, 2097174, 262144, 0, 0 ] } , "name": "/layers.27/self_attn/k_proj/Linear", "outputIndexes": [ 3659 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3659 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3660 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3660 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2496 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2462, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2497 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2470, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2498 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2497, 2498, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_1_output_0", "outputIndexes": [ 2499 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2496, 2499 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_1_output_0", "outputIndexes": [ 2500 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2500, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_2_output_0", "outputIndexes": [ 2501 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2500 ] , "main_type": "NONE", "name": "/blocks.27/self_attn/Shape_3_output_0", "outputIndexes": [ 2502 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2502 ] , "main_type": "NONE", "name": "Shape3686", "outputIndexes": [ 2503 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2502 ] , "main_type": "NONE", "name": "Rank3688", "outputIndexes": [ 2504 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2504, 2504 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3690", "outputIndexes": [ 2505 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2505 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3691", "outputIndexes": [ 2506 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2505, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3693", "outputIndexes": [ 2507 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2507 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3694", "outputIndexes": [ 2508 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2503, 2506, 2508, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3697", "outputIndexes": [ 2509 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2509 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3698", "outputIndexes": [ 2510 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2510 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3699", "outputIndexes": [ 2511 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2511, 2510 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3700", "outputIndexes": [ 2512 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2502, 2512, 2505 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.27/self_attn/Gather_3_output_0", "outputIndexes": [ 2513 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2513, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Div_1_output_0", "outputIndexes": [ 2514 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2514, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2515 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2500, 2515, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_3_output_0", "outputIndexes": [ 2516 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2516 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.27/self_attn/Neg_1_output_0", "outputIndexes": [ 2517 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2514, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2518 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2500, 20, 2518, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.27/self_attn/Slice_2_output_0", "outputIndexes": [ 2519 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2517, 2519 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.27/self_attn/Concat_4_output_0", "outputIndexes": [ 2520 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2520, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Mul_3_output_0", "outputIndexes": [ 2521 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2501, 2521 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/self_attn/Add_1_output_0", "outputIndexes": [ 2522 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3654 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3326054506, 2097174, 262144, 0, 0 ] } , "name": "/layers.27/self_attn/v_proj/Linear", "outputIndexes": [ 3663 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3663 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3664 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3664 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2523 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2462, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2524 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2470, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.27/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2525 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2524, 2525, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.27/self_attn/Concat_2_output_0", "outputIndexes": [ 2526 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2523, 2526 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.27/self_attn/Reshape_2_output_0", "outputIndexes": [ 2527 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2495, 2522, 2527, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.27/self_attn/FusedAttention", "outputIndexes": [ 2528 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2528 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3665 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3665 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3666 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3666 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3328413824, 8388630, 1048576, 0, 0 ] } , "name": "/layers.27/self_attn/o_proj/Linear", "outputIndexes": [ 3667 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3667 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3668 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3668 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2529 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2449, 2529 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/Add_output_0", "outputIndexes": [ 2530 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2530 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3337851030, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.27/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2531 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2531 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3669 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3669 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3670 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3670 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3337883798, 29360150, 3670016, 0, 0 ] } , "name": "/layers.27/mlp/gate_proj/Linear", "outputIndexes": [ 3671 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3671 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3672 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3672 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2532 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2532 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.27/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2533 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3670 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3370913964, 29360150, 3670016, 0, 0 ] } , "name": "/layers.27/mlp/up_proj/Linear", "outputIndexes": [ 3675 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3675 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3676 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3676 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2534 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2533, 2534 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/mlp/Mul_output_0", "outputIndexes": [ 2535 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2535 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3677 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3677 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3678 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3678 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3403944130, 29360150, 3670016, 0, 0 ] } , "name": "/layers.27/mlp/down_proj/Linear", "outputIndexes": [ 3679 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3679 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3680 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3680 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2536 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2530, 2536 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.27/Add_1_output_0", "outputIndexes": [ 2537 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2537, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/Reshape_output_0", "outputIndexes": [ 2538 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2538 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3436974296, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.28/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2539 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2539 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3681 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3681 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3682 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3682 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3437007064, 8388630, 1048576, 0, 0 ] } , "name": "/layers.28/self_attn/q_proj/Linear", "outputIndexes": [ 3683 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3683 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3684 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3684 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2540 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2539 ] , "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_output_0", "outputIndexes": [ 2541 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2541 ] , "main_type": "NONE", "name": "Shape3746", "outputIndexes": [ 2542 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2541 ] , "main_type": "NONE", "name": "Rank3748", "outputIndexes": [ 2543 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2543, 2543 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3750", "outputIndexes": [ 2544 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2544 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3751", "outputIndexes": [ 2545 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2544, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3753", "outputIndexes": [ 2546 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2546 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3754", "outputIndexes": [ 2547 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2542, 2545, 2547, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3757", "outputIndexes": [ 2548 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2548 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3758", "outputIndexes": [ 2549 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2549, 2549 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3760", "outputIndexes": [ 2550 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2541, 2550, 2544 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_output_0", "outputIndexes": [ 2551 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2551, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2552 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2544 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3768", "outputIndexes": [ 2553 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2546 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3771", "outputIndexes": [ 2554 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2542, 2553, 2554, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3774", "outputIndexes": [ 2555 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2555 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3775", "outputIndexes": [ 2556 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2556 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3776", "outputIndexes": [ 2557 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2557, 2556 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3777", "outputIndexes": [ 2558 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2541, 2558, 2544 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_1_output_0", "outputIndexes": [ 2559 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2559, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2560 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2552, 2560, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.28/self_attn/Concat_output_0", "outputIndexes": [ 2561 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2540, 2561 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/self_attn/Reshape_output_0", "outputIndexes": [ 2562 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2562, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_output_0", "outputIndexes": [ 2563 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2562 ] , "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_2_output_0", "outputIndexes": [ 2564 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2564 ] , "main_type": "NONE", "name": "Shape3784", "outputIndexes": [ 2565 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2564 ] , "main_type": "NONE", "name": "Rank3786", "outputIndexes": [ 2566 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2566, 2566 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3788", "outputIndexes": [ 2567 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2567 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3789", "outputIndexes": [ 2568 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2567, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3791", "outputIndexes": [ 2569 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2569 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3792", "outputIndexes": [ 2570 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2565, 2568, 2570, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3795", "outputIndexes": [ 2571 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2571 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3796", "outputIndexes": [ 2572 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2572 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3797", "outputIndexes": [ 2573 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2573, 2572 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3798", "outputIndexes": [ 2574 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2564, 2574, 2567 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_2_output_0", "outputIndexes": [ 2575 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2575, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Div_output_0", "outputIndexes": [ 2576 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2576, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2577 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2562, 2577, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_1_output_0", "outputIndexes": [ 2578 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.28/self_attn/Neg_output_0", "outputIndexes": [ 2579 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2576, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2580 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2562, 20, 2580, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_output_0", "outputIndexes": [ 2581 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2579, 2581 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.28/self_attn/Concat_3_output_0", "outputIndexes": [ 2582 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2582, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_1_output_0", "outputIndexes": [ 2583 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2563, 2583 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Add_output_0", "outputIndexes": [ 2584 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3682 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3446444270, 2097174, 262144, 0, 0 ] } , "name": "/layers.28/self_attn/k_proj/Linear", "outputIndexes": [ 3687 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3687 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3688 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3688 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2585 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2551, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2586 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2559, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2587 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2586, 2587, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.28/self_attn/Concat_1_output_0", "outputIndexes": [ 2588 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2585, 2588 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/self_attn/Reshape_1_output_0", "outputIndexes": [ 2589 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2589, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_2_output_0", "outputIndexes": [ 2590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2589 ] , "main_type": "NONE", "name": "/blocks.28/self_attn/Shape_3_output_0", "outputIndexes": [ 2591 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2591 ] , "main_type": "NONE", "name": "Shape3817", "outputIndexes": [ 2592 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2591 ] , "main_type": "NONE", "name": "Rank3819", "outputIndexes": [ 2593 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2593, 2593 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3821", "outputIndexes": [ 2594 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2594 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3822", "outputIndexes": [ 2595 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2594, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3824", "outputIndexes": [ 2596 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2596 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3825", "outputIndexes": [ 2597 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2592, 2595, 2597, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3828", "outputIndexes": [ 2598 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2598 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3829", "outputIndexes": [ 2599 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2599 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3830", "outputIndexes": [ 2600 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2600, 2599 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3831", "outputIndexes": [ 2601 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2591, 2601, 2594 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.28/self_attn/Gather_3_output_0", "outputIndexes": [ 2602 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2602, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Div_1_output_0", "outputIndexes": [ 2603 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2603, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2604 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2589, 2604, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_3_output_0", "outputIndexes": [ 2605 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2605 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.28/self_attn/Neg_1_output_0", "outputIndexes": [ 2606 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2603, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2607 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2589, 20, 2607, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.28/self_attn/Slice_2_output_0", "outputIndexes": [ 2608 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2606, 2608 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.28/self_attn/Concat_4_output_0", "outputIndexes": [ 2609 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2609, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Mul_3_output_0", "outputIndexes": [ 2610 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2590, 2610 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/self_attn/Add_1_output_0", "outputIndexes": [ 2611 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3682 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3448803588, 2097174, 262144, 0, 0 ] } , "name": "/layers.28/self_attn/v_proj/Linear", "outputIndexes": [ 3691 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3691 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3692 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3692 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2612 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2551, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2613 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2559, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.28/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2614 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2613, 2614, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.28/self_attn/Concat_2_output_0", "outputIndexes": [ 2615 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2612, 2615 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.28/self_attn/Reshape_2_output_0", "outputIndexes": [ 2616 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2584, 2611, 2616, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.28/self_attn/FusedAttention", "outputIndexes": [ 2617 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2617 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3693 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3693 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3694 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3694 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3451162906, 8388630, 1048576, 0, 0 ] } , "name": "/layers.28/self_attn/o_proj/Linear", "outputIndexes": [ 3695 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3695 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3696 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3696 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2618 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2538, 2618 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/Add_output_0", "outputIndexes": [ 2619 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2619 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3460600112, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.28/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2620 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2620 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3697 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3697 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3698 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3698 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3460632880, 29360150, 3670016, 0, 0 ] } , "name": "/layers.28/mlp/gate_proj/Linear", "outputIndexes": [ 3699 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3699 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3700 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3700 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2621 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2621 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.28/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2622 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3698 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3493663046, 29360150, 3670016, 0, 0 ] } , "name": "/layers.28/mlp/up_proj/Linear", "outputIndexes": [ 3703 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3703 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3704 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3704 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2623 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2622, 2623 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/mlp/Mul_output_0", "outputIndexes": [ 2624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2624 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3705 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3705 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3706 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3706 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3526693212, 29360150, 3670016, 0, 0 ] } , "name": "/layers.28/mlp/down_proj/Linear", "outputIndexes": [ 3707 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3707 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3708 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3708 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2625 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2619, 2625 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.28/Add_1_output_0", "outputIndexes": [ 2626 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2626, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/Reshape_output_0", "outputIndexes": [ 2627 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2627 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3559723378, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.29/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2628 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2628 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3709 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3709 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3710 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3710 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3559756146, 8388630, 1048576, 0, 0 ] } , "name": "/layers.29/self_attn/q_proj/Linear", "outputIndexes": [ 3711 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3711 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3712 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3712 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2629 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2628 ] , "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_output_0", "outputIndexes": [ 2630 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2630 ] , "main_type": "NONE", "name": "Shape3877", "outputIndexes": [ 2631 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2630 ] , "main_type": "NONE", "name": "Rank3879", "outputIndexes": [ 2632 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2632, 2632 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3881", "outputIndexes": [ 2633 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2633 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3882", "outputIndexes": [ 2634 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2633, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3884", "outputIndexes": [ 2635 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2635 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3885", "outputIndexes": [ 2636 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2631, 2634, 2636, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3888", "outputIndexes": [ 2637 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2637 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3889", "outputIndexes": [ 2638 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2638, 2638 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3891", "outputIndexes": [ 2639 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2630, 2639, 2633 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_output_0", "outputIndexes": [ 2640 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2640, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2641 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2633 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3899", "outputIndexes": [ 2642 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2635 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3902", "outputIndexes": [ 2643 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2631, 2642, 2643, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3905", "outputIndexes": [ 2644 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2644 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3906", "outputIndexes": [ 2645 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2645 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3907", "outputIndexes": [ 2646 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2646, 2645 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3908", "outputIndexes": [ 2647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2630, 2647, 2633 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_1_output_0", "outputIndexes": [ 2648 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2648, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2649 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2641, 2649, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.29/self_attn/Concat_output_0", "outputIndexes": [ 2650 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2629, 2650 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/self_attn/Reshape_output_0", "outputIndexes": [ 2651 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2651, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_output_0", "outputIndexes": [ 2652 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2651 ] , "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_2_output_0", "outputIndexes": [ 2653 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2653 ] , "main_type": "NONE", "name": "Shape3915", "outputIndexes": [ 2654 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2653 ] , "main_type": "NONE", "name": "Rank3917", "outputIndexes": [ 2655 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2655, 2655 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3919", "outputIndexes": [ 2656 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2656 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3920", "outputIndexes": [ 2657 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2656, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3922", "outputIndexes": [ 2658 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2658 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3923", "outputIndexes": [ 2659 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2654, 2657, 2659, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3926", "outputIndexes": [ 2660 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2660 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3927", "outputIndexes": [ 2661 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2661 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3928", "outputIndexes": [ 2662 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2662, 2661 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3929", "outputIndexes": [ 2663 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2653, 2663, 2656 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_2_output_0", "outputIndexes": [ 2664 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2664, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Div_output_0", "outputIndexes": [ 2665 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2665, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2666 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2651, 2666, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_1_output_0", "outputIndexes": [ 2667 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2667 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.29/self_attn/Neg_output_0", "outputIndexes": [ 2668 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2665, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2669 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2651, 20, 2669, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_output_0", "outputIndexes": [ 2670 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2668, 2670 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.29/self_attn/Concat_3_output_0", "outputIndexes": [ 2671 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2671, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_1_output_0", "outputIndexes": [ 2672 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2652, 2672 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Add_output_0", "outputIndexes": [ 2673 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3710 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3569193352, 2097174, 262144, 0, 0 ] } , "name": "/layers.29/self_attn/k_proj/Linear", "outputIndexes": [ 3715 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3715 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3716 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3716 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2674 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2640, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2675 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2648, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2676 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2675, 2676, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.29/self_attn/Concat_1_output_0", "outputIndexes": [ 2677 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2674, 2677 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/self_attn/Reshape_1_output_0", "outputIndexes": [ 2678 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2678, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_2_output_0", "outputIndexes": [ 2679 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2678 ] , "main_type": "NONE", "name": "/blocks.29/self_attn/Shape_3_output_0", "outputIndexes": [ 2680 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2680 ] , "main_type": "NONE", "name": "Shape3948", "outputIndexes": [ 2681 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2680 ] , "main_type": "NONE", "name": "Rank3950", "outputIndexes": [ 2682 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2682, 2682 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3952", "outputIndexes": [ 2683 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2683 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3953", "outputIndexes": [ 2684 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2683, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3955", "outputIndexes": [ 2685 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2685 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3956", "outputIndexes": [ 2686 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2681, 2684, 2686, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3959", "outputIndexes": [ 2687 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2687 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3960", "outputIndexes": [ 2688 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2688 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3961", "outputIndexes": [ 2689 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2689, 2688 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3962", "outputIndexes": [ 2690 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2680, 2690, 2683 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.29/self_attn/Gather_3_output_0", "outputIndexes": [ 2691 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2691, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Div_1_output_0", "outputIndexes": [ 2692 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2692, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2693 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2678, 2693, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_3_output_0", "outputIndexes": [ 2694 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2694 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.29/self_attn/Neg_1_output_0", "outputIndexes": [ 2695 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2692, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2696 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2678, 20, 2696, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.29/self_attn/Slice_2_output_0", "outputIndexes": [ 2697 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2695, 2697 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.29/self_attn/Concat_4_output_0", "outputIndexes": [ 2698 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2698, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Mul_3_output_0", "outputIndexes": [ 2699 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2679, 2699 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/self_attn/Add_1_output_0", "outputIndexes": [ 2700 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3710 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3571552670, 2097174, 262144, 0, 0 ] } , "name": "/layers.29/self_attn/v_proj/Linear", "outputIndexes": [ 3719 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3719 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3720 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3720 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2701 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2640, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2702 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2648, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.29/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2703 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2702, 2703, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.29/self_attn/Concat_2_output_0", "outputIndexes": [ 2704 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2701, 2704 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.29/self_attn/Reshape_2_output_0", "outputIndexes": [ 2705 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2673, 2700, 2705, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.29/self_attn/FusedAttention", "outputIndexes": [ 2706 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2706 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3721 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3721 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3722 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3722 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3573911988, 8388630, 1048576, 0, 0 ] } , "name": "/layers.29/self_attn/o_proj/Linear", "outputIndexes": [ 3723 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3723 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3724 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3724 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2707 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2627, 2707 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/Add_output_0", "outputIndexes": [ 2708 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2708 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3583349194, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.29/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2709 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2709 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3725 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3725 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3726 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3726 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3583381962, 29360150, 3670016, 0, 0 ] } , "name": "/layers.29/mlp/gate_proj/Linear", "outputIndexes": [ 3727 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3727 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3728 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3728 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2710 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2710 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.29/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2711 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3726 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3616412128, 29360150, 3670016, 0, 0 ] } , "name": "/layers.29/mlp/up_proj/Linear", "outputIndexes": [ 3731 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3731 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3732 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3732 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2712 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2711, 2712 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/mlp/Mul_output_0", "outputIndexes": [ 2713 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2713 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3733 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3733 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3734 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3734 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3649442294, 29360150, 3670016, 0, 0 ] } , "name": "/layers.29/mlp/down_proj/Linear", "outputIndexes": [ 3735 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3735 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3736 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3736 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2714 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2708, 2714 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.29/Add_1_output_0", "outputIndexes": [ 2715 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2715, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/Reshape_output_0", "outputIndexes": [ 2716 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2716 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3682472460, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.30/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2717 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2717 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3737 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3737 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3738 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3738 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3682505228, 8388630, 1048576, 0, 0 ] } , "name": "/layers.30/self_attn/q_proj/Linear", "outputIndexes": [ 3739 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3739 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3740 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3740 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2718 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2717 ] , "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_output_0", "outputIndexes": [ 2719 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2719 ] , "main_type": "NONE", "name": "Shape4008", "outputIndexes": [ 2720 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2719 ] , "main_type": "NONE", "name": "Rank4010", "outputIndexes": [ 2721 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2721, 2721 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4012", "outputIndexes": [ 2722 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2722 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4013", "outputIndexes": [ 2723 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2722, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4015", "outputIndexes": [ 2724 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2724 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4016", "outputIndexes": [ 2725 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2720, 2723, 2725, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4019", "outputIndexes": [ 2726 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2726 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4020", "outputIndexes": [ 2727 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2727, 2727 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4022", "outputIndexes": [ 2728 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2719, 2728, 2722 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_output_0", "outputIndexes": [ 2729 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2729, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2730 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2722 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4030", "outputIndexes": [ 2731 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2724 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4033", "outputIndexes": [ 2732 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2720, 2731, 2732, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4036", "outputIndexes": [ 2733 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2733 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4037", "outputIndexes": [ 2734 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2734 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4038", "outputIndexes": [ 2735 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2735, 2734 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4039", "outputIndexes": [ 2736 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2719, 2736, 2722 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_1_output_0", "outputIndexes": [ 2737 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2737, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2738 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2730, 2738, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.30/self_attn/Concat_output_0", "outputIndexes": [ 2739 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2718, 2739 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/self_attn/Reshape_output_0", "outputIndexes": [ 2740 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2740, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_output_0", "outputIndexes": [ 2741 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2740 ] , "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_2_output_0", "outputIndexes": [ 2742 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2742 ] , "main_type": "NONE", "name": "Shape4046", "outputIndexes": [ 2743 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2742 ] , "main_type": "NONE", "name": "Rank4048", "outputIndexes": [ 2744 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2744, 2744 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4050", "outputIndexes": [ 2745 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2745 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4051", "outputIndexes": [ 2746 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2745, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4053", "outputIndexes": [ 2747 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2747 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4054", "outputIndexes": [ 2748 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2743, 2746, 2748, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4057", "outputIndexes": [ 2749 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2749 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4058", "outputIndexes": [ 2750 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2750 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4059", "outputIndexes": [ 2751 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2751, 2750 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4060", "outputIndexes": [ 2752 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2742, 2752, 2745 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_2_output_0", "outputIndexes": [ 2753 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2753, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Div_output_0", "outputIndexes": [ 2754 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2754, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2755 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2740, 2755, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_1_output_0", "outputIndexes": [ 2756 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2756 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.30/self_attn/Neg_output_0", "outputIndexes": [ 2757 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2754, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2758 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2740, 20, 2758, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_output_0", "outputIndexes": [ 2759 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2757, 2759 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.30/self_attn/Concat_3_output_0", "outputIndexes": [ 2760 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2760, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_1_output_0", "outputIndexes": [ 2761 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2741, 2761 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Add_output_0", "outputIndexes": [ 2762 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3738 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3691942434, 2097174, 262144, 0, 0 ] } , "name": "/layers.30/self_attn/k_proj/Linear", "outputIndexes": [ 3743 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3743 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3744 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3744 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2763 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2729, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2764 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2737, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2765 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2764, 2765, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.30/self_attn/Concat_1_output_0", "outputIndexes": [ 2766 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2763, 2766 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/self_attn/Reshape_1_output_0", "outputIndexes": [ 2767 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2767, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_2_output_0", "outputIndexes": [ 2768 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2767 ] , "main_type": "NONE", "name": "/blocks.30/self_attn/Shape_3_output_0", "outputIndexes": [ 2769 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2769 ] , "main_type": "NONE", "name": "Shape4079", "outputIndexes": [ 2770 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2769 ] , "main_type": "NONE", "name": "Rank4081", "outputIndexes": [ 2771 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2771, 2771 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4083", "outputIndexes": [ 2772 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2772 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4084", "outputIndexes": [ 2773 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2772, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4086", "outputIndexes": [ 2774 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2774 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4087", "outputIndexes": [ 2775 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2770, 2773, 2775, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4090", "outputIndexes": [ 2776 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2776 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4091", "outputIndexes": [ 2777 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2777 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4092", "outputIndexes": [ 2778 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2778, 2777 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4093", "outputIndexes": [ 2779 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2769, 2779, 2772 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.30/self_attn/Gather_3_output_0", "outputIndexes": [ 2780 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2780, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Div_1_output_0", "outputIndexes": [ 2781 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2781, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2782 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2767, 2782, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_3_output_0", "outputIndexes": [ 2783 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2783 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.30/self_attn/Neg_1_output_0", "outputIndexes": [ 2784 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2781, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2785 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2767, 20, 2785, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.30/self_attn/Slice_2_output_0", "outputIndexes": [ 2786 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2784, 2786 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.30/self_attn/Concat_4_output_0", "outputIndexes": [ 2787 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2787, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Mul_3_output_0", "outputIndexes": [ 2788 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2768, 2788 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/self_attn/Add_1_output_0", "outputIndexes": [ 2789 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3738 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3694301752, 2097174, 262144, 0, 0 ] } , "name": "/layers.30/self_attn/v_proj/Linear", "outputIndexes": [ 3747 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3747 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3748 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3748 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2790 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2729, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2791 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2737, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.30/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2792 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2791, 2792, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.30/self_attn/Concat_2_output_0", "outputIndexes": [ 2793 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2790, 2793 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.30/self_attn/Reshape_2_output_0", "outputIndexes": [ 2794 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2762, 2789, 2794, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.30/self_attn/FusedAttention", "outputIndexes": [ 2795 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2795 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3749 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3749 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3750 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3750 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3696661070, 8388630, 1048576, 0, 0 ] } , "name": "/layers.30/self_attn/o_proj/Linear", "outputIndexes": [ 3751 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3751 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3752 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3752 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2796 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2716, 2796 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/Add_output_0", "outputIndexes": [ 2797 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2797 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3706098276, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.30/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2798 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2798 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3753 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3753 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3754 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3754 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3706131044, 29360150, 3670016, 0, 0 ] } , "name": "/layers.30/mlp/gate_proj/Linear", "outputIndexes": [ 3755 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3755 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3756 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3756 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2799 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2799 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.30/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2800 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3754 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3739161210, 29360150, 3670016, 0, 0 ] } , "name": "/layers.30/mlp/up_proj/Linear", "outputIndexes": [ 3759 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3759 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3760 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3760 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2801 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2800, 2801 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/mlp/Mul_output_0", "outputIndexes": [ 2802 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2802 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3761 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3761 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3762 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3762 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3772191376, 29360150, 3670016, 0, 0 ] } , "name": "/layers.30/mlp/down_proj/Linear", "outputIndexes": [ 3763 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3763 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3764 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3764 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2803 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2797, 2803 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.30/Add_1_output_0", "outputIndexes": [ 2804 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2804, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/Reshape_output_0", "outputIndexes": [ 2805 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2805 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3805221542, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.31/input_layernorm/Mul_1_output_0", "outputIndexes": [ 2806 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2806 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3765 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3765 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3766 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3766 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3805254310, 8388630, 1048576, 0, 0 ] } , "name": "/layers.31/self_attn/q_proj/Linear", "outputIndexes": [ 3767 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3767 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3768 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3768 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2807 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2806 ] , "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_output_0", "outputIndexes": [ 2808 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2808 ] , "main_type": "NONE", "name": "Shape4139", "outputIndexes": [ 2809 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2808 ] , "main_type": "NONE", "name": "Rank4141", "outputIndexes": [ 2810 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2810, 2810 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4143", "outputIndexes": [ 2811 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2811 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4144", "outputIndexes": [ 2812 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2811, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4146", "outputIndexes": [ 2813 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2813 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4147", "outputIndexes": [ 2814 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2809, 2812, 2814, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4150", "outputIndexes": [ 2815 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2815 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4151", "outputIndexes": [ 2816 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2816, 2816 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4153", "outputIndexes": [ 2817 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2808, 2817, 2811 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_output_0", "outputIndexes": [ 2818 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2818, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_output_0", "outputIndexes": [ 2819 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2811 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4161", "outputIndexes": [ 2820 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2813 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4164", "outputIndexes": [ 2821 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2809, 2820, 2821, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4167", "outputIndexes": [ 2822 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2822 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4168", "outputIndexes": [ 2823 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2823 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4169", "outputIndexes": [ 2824 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2824, 2823 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4170", "outputIndexes": [ 2825 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2808, 2825, 2811 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_1_output_0", "outputIndexes": [ 2826 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2826, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_1_output_0", "outputIndexes": [ 2827 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2819, 2827, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.31/self_attn/Concat_output_0", "outputIndexes": [ 2828 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2807, 2828 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/self_attn/Reshape_output_0", "outputIndexes": [ 2829 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2829, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_output_0", "outputIndexes": [ 2830 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2829 ] , "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_2_output_0", "outputIndexes": [ 2831 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2831 ] , "main_type": "NONE", "name": "Shape4177", "outputIndexes": [ 2832 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2831 ] , "main_type": "NONE", "name": "Rank4179", "outputIndexes": [ 2833 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2833, 2833 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4181", "outputIndexes": [ 2834 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2834 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4182", "outputIndexes": [ 2835 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2834, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4184", "outputIndexes": [ 2836 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2836 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4185", "outputIndexes": [ 2837 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2832, 2835, 2837, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4188", "outputIndexes": [ 2838 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2838 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4189", "outputIndexes": [ 2839 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2839 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4190", "outputIndexes": [ 2840 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2840, 2839 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4191", "outputIndexes": [ 2841 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2831, 2841, 2834 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_2_output_0", "outputIndexes": [ 2842 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2842, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Div_output_0", "outputIndexes": [ 2843 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2843, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_7_output_0", "outputIndexes": [ 2844 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2829, 2844, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_1_output_0", "outputIndexes": [ 2845 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2845 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.31/self_attn/Neg_output_0", "outputIndexes": [ 2846 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2843, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_6_output_0", "outputIndexes": [ 2847 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2829, 20, 2847, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_output_0", "outputIndexes": [ 2848 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2846, 2848 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.31/self_attn/Concat_3_output_0", "outputIndexes": [ 2849 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2849, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_1_output_0", "outputIndexes": [ 2850 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2830, 2850 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Add_output_0", "outputIndexes": [ 2851 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3766 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3814691516, 2097174, 262144, 0, 0 ] } , "name": "/layers.31/self_attn/k_proj/Linear", "outputIndexes": [ 3771 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3771 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3772 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3772 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2852 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2818, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_2_output_0", "outputIndexes": [ 2853 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2826, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_3_output_0", "outputIndexes": [ 2854 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2853, 2854, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.31/self_attn/Concat_1_output_0", "outputIndexes": [ 2855 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2852, 2855 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/self_attn/Reshape_1_output_0", "outputIndexes": [ 2856 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2856, 57 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_2_output_0", "outputIndexes": [ 2857 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2856 ] , "main_type": "NONE", "name": "/blocks.31/self_attn/Shape_3_output_0", "outputIndexes": [ 2858 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2858 ] , "main_type": "NONE", "name": "Shape4210", "outputIndexes": [ 2859 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2858 ] , "main_type": "NONE", "name": "Rank4212", "outputIndexes": [ 2860 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2860, 2860 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4214", "outputIndexes": [ 2861 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2861 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4215", "outputIndexes": [ 2862 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2861, 12 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4217", "outputIndexes": [ 2863 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2863 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4218", "outputIndexes": [ 2864 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2859, 2862, 2864, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4221", "outputIndexes": [ 2865 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2865 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4222", "outputIndexes": [ 2866 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 2866 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4223", "outputIndexes": [ 2867 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2867, 2866 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4224", "outputIndexes": [ 2868 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2858, 2868, 2861 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/blocks.31/self_attn/Gather_3_output_0", "outputIndexes": [ 2869 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2869, 72 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Div_1_output_0", "outputIndexes": [ 2870 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2870, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_9_output_0", "outputIndexes": [ 2871 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2856, 2871, 75, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_3_output_0", "outputIndexes": [ 2872 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2872 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/blocks.31/self_attn/Neg_1_output_0", "outputIndexes": [ 2873 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2870, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_8_output_0", "outputIndexes": [ 2874 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2856, 20, 2874, 76, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/blocks.31/self_attn/Slice_2_output_0", "outputIndexes": [ 2875 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2873, 2875 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/blocks.31/self_attn/Concat_4_output_0", "outputIndexes": [ 2876 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2876, 88 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Mul_3_output_0", "outputIndexes": [ 2877 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2857, 2877 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/self_attn/Add_1_output_0", "outputIndexes": [ 2878 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3766 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 32768, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3817050834, 2097174, 262144, 0, 0 ] } , "name": "/layers.31/self_attn/v_proj/Linear", "outputIndexes": [ 3775 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3775 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3776 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3776 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2879 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2818, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_4_output_0", "outputIndexes": [ 2880 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2826, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/blocks.31/self_attn/Unsqueeze_5_output_0", "outputIndexes": [ 2881 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2880, 2881, 94, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/blocks.31/self_attn/Concat_2_output_0", "outputIndexes": [ 2882 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2879, 2882 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/blocks.31/self_attn/Reshape_2_output_0", "outputIndexes": [ 2883 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2851, 2878, 2883, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "/layers.31/self_attn/FusedAttention", "outputIndexes": [ 2884 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2884 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3777 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3777 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3778 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3778 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 131072, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3819410152, 8388630, 1048576, 0, 0 ] } , "name": "/layers.31/self_attn/o_proj/Linear", "outputIndexes": [ 3779 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3779 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3780 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3780 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2885 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2805, 2885 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/Add_output_0", "outputIndexes": [ 2886 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2886 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3828847358, 16384, 16384 ] , "useRMSNorm": true } , "name": "/blocks.31/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 2887 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2887 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3781 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3781 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3782 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3782 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3828880126, 29360150, 3670016, 0, 0 ] } , "name": "/layers.31/mlp/gate_proj/Linear", "outputIndexes": [ 3783 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3783 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3784 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3784 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2888 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2888 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/blocks.31/mlp/act_fn/Mul_output_0", "outputIndexes": [ 2889 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3782 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 14336, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3861910292, 29360150, 3670016, 0, 0 ] } , "name": "/layers.31/mlp/up_proj/Linear", "outputIndexes": [ 3787 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3787 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3788 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3788 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 14336 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2890 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2889, 2890 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/mlp/Mul_output_0", "outputIndexes": [ 2891 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2891 ] , "main_type": "Reshape", "main": { "dims": [ -1, 14336, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3789 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3789 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3790 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3790 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 14336, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 458752, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3894940458, 29360150, 3670016, 0, 0 ] } , "name": "/layers.31/mlp/down_proj/Linear", "outputIndexes": [ 3791 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3791 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3792 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3792 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2892 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2886, 2892 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/blocks.31/Add_1_output_0", "outputIndexes": [ 2893 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2893, 1, 75, 15, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_output_0", "outputIndexes": [ 2894 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2894 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3927970624, 16384, 16384 ] , "useRMSNorm": true } , "name": "hidden_states", "outputIndexes": [ 2895 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2895 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/pre_reshape", "outputIndexes": [ 3793 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3793 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/lm/lm_head/Linear/pre_convert", "outputIndexes": [ 3794 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3794 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128256, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4104192, "has_scaleInt": false, "shapeInt32": true, "weightSize": 0 } , "external": [ 3928003392, 262668314, 32833536, 0, 0 ] } , "name": "/lm/lm_head/Linear", "outputIndexes": [ 3795 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3795 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/lm/lm_head/Linear/post_convert", "outputIndexes": [ 3796 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3796 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128256 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/post_reshape", "outputIndexes": [ 2896 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } ] , "outputName": [ "logits", "hidden_states" ] , "preferForwardType": "CPU", "sourceType": "ONNX", "tensorName": [ "position_ids", "logits_index", "input_ids", "/blocks.0/Constant_output_0", "/blocks.0/Reshape_output_0", "/blocks.0/input_layernorm/Mul_1_output_0", "/blocks.0/self_attn/q_proj/FakeLinear_output_0", "/blocks.0/self_attn/Shape_output_0", "Shape21", "Rank23", "BinaryOp25", "Unsqueeze26", "Const27", "BinaryOp28", "Unsqueeze29", "Unsqueeze31", "StridedSlice32", "Squeeze33", "BinaryOp35", "/blocks.0/self_attn/Gather_output_0", "/rotary/Constant_3_output_0", "/blocks.0/self_attn/Unsqueeze_output_0", "Unsqueeze45", "Unsqueeze48", "StridedSlice51", "Squeeze52", "BinaryOp53", "BinaryOp54", "/blocks.0/self_attn/Gather_1_output_0", "/blocks.0/self_attn/Unsqueeze_1_output_0", "/blocks.0/self_attn/Constant_2_output_0", "/blocks.0/self_attn/Constant_3_output_0", "/blocks.0/self_attn/Concat_output_0", "/blocks.0/self_attn/Reshape_output_0", "/rotary/Cast_output_0", "/rotary/Constant_output_0", "/rotary/Reshape_output_0", "/rotary/Constant_1_output_0", "/rotary/Mul_output_0", "/rotary/Cos_output_0", "/rotary/Unsqueeze_output_0", "/rotary/Sin_output_0", "/rotary/Unsqueeze_1_output_0", "/rotary/Concat_output_0", "/rotary/Concat_1_output_0", "/rotary/Constant_5_output_0", "/rotary/Unsqueeze_2_output_0", "/rotary/Unsqueeze_3_output_0", "Shape76", "Rank78", "BinaryOp80", "Unsqueeze81", "BinaryOp83", "Unsqueeze84", "StridedSlice87", "Squeeze88", "BinaryOp90", "/blocks.0/self_attn/Gather_2_output_0", "/blocks.0/self_attn/Mul_output_0", "/blocks.0/self_attn/Shape_2_output_0", "/blocks.0/self_attn/Constant_8_output_0", "Shape95", "Rank97", "BinaryOp99", "Unsqueeze100", "BinaryOp102", "Unsqueeze103", "StridedSlice106", "Squeeze107", "BinaryOp108", "BinaryOp109", "/blocks.0/self_attn/Gather_4_output_0", "/blocks.0/self_attn/Constant_9_output_0", "/blocks.0/self_attn/Div_output_0", "/blocks.0/self_attn/Unsqueeze_7_output_0", "/blocks.0/self_attn/Constant_16_output_0", "/blocks.0/self_attn/Constant_10_output_0", "/blocks.0/self_attn/Slice_1_output_0", "/blocks.0/self_attn/Neg_output_0", "/blocks.0/self_attn/Unsqueeze_6_output_0", "/blocks.0/self_attn/Slice_output_0", "/blocks.0/self_attn/Concat_3_output_0", "Unsqueeze127", "Unsqueeze130", "StridedSlice133", "Squeeze134", "BinaryOp135", "BinaryOp136", "/blocks.0/self_attn/Gather_3_output_0", "/blocks.0/self_attn/Mul_1_output_0", "/blocks.0/self_attn/Add_output_0", "/blocks.0/self_attn/k_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_2_output_0", "/blocks.0/self_attn/Unsqueeze_3_output_0", "/blocks.0/self_attn/Constant_4_output_0", "/blocks.0/self_attn/Concat_1_output_0", "/blocks.0/self_attn/Reshape_1_output_0", "/blocks.0/self_attn/Mul_2_output_0", "/blocks.0/self_attn/Shape_3_output_0", "Shape148", "Rank150", "BinaryOp152", "Unsqueeze153", "BinaryOp155", "Unsqueeze156", "StridedSlice159", "Squeeze160", "BinaryOp161", "BinaryOp162", "/blocks.0/self_attn/Gather_5_output_0", "/blocks.0/self_attn/Div_1_output_0", "/blocks.0/self_attn/Unsqueeze_9_output_0", "/blocks.0/self_attn/Slice_3_output_0", "/blocks.0/self_attn/Neg_1_output_0", "/blocks.0/self_attn/Unsqueeze_8_output_0", "/blocks.0/self_attn/Slice_2_output_0", "/blocks.0/self_attn/Concat_4_output_0", "/blocks.0/self_attn/Mul_3_output_0", "/blocks.0/self_attn/Add_1_output_0", "/blocks.0/self_attn/v_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_4_output_0", "/blocks.0/self_attn/Unsqueeze_5_output_0", "/blocks.0/self_attn/Concat_2_output_0", "/blocks.0/self_attn/Reshape_2_output_0", "attention_mask", "/blocks.0/self_attn/fused_attn/FusedAttention_output_0", "/blocks.0/self_attn/o_proj/FakeLinear_output_0", "/blocks.0/Add_output_0", "/blocks.0/post_attention_layernorm/Mul_1_output_0", "/blocks.0/mlp/gate_proj/FakeLinear_output_0", "/blocks.0/mlp/act_fn/Mul_output_0", "/blocks.0/mlp/up_proj/FakeLinear_output_0", "/blocks.0/mlp/Mul_output_0", "/blocks.0/mlp/down_proj/FakeLinear_output_0", "/blocks.0/Add_1_output_0", "/blocks.1/Reshape_output_0", "/blocks.1/input_layernorm/Mul_1_output_0", "/blocks.1/self_attn/q_proj/FakeLinear_output_0", "/blocks.1/self_attn/Shape_output_0", "Shape209", "Rank211", "BinaryOp213", "Unsqueeze214", "BinaryOp216", "Unsqueeze217", "StridedSlice220", "Squeeze221", "BinaryOp223", "/blocks.1/self_attn/Gather_output_0", "/blocks.1/self_attn/Unsqueeze_output_0", "Unsqueeze231", "Unsqueeze234", "StridedSlice237", "Squeeze238", "BinaryOp239", "BinaryOp240", "/blocks.1/self_attn/Gather_1_output_0", "/blocks.1/self_attn/Unsqueeze_1_output_0", "/blocks.1/self_attn/Concat_output_0", "/blocks.1/self_attn/Reshape_output_0", "/blocks.1/self_attn/Mul_output_0", "/blocks.1/self_attn/Shape_2_output_0", "Shape247", "Rank249", "BinaryOp251", "Unsqueeze252", "BinaryOp254", "Unsqueeze255", "StridedSlice258", "Squeeze259", "BinaryOp260", "BinaryOp261", "/blocks.1/self_attn/Gather_2_output_0", "/blocks.1/self_attn/Div_output_0", "/blocks.1/self_attn/Unsqueeze_7_output_0", "/blocks.1/self_attn/Slice_1_output_0", "/blocks.1/self_attn/Neg_output_0", "/blocks.1/self_attn/Unsqueeze_6_output_0", "/blocks.1/self_attn/Slice_output_0", "/blocks.1/self_attn/Concat_3_output_0", "/blocks.1/self_attn/Mul_1_output_0", "/blocks.1/self_attn/Add_output_0", "/blocks.1/self_attn/k_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_2_output_0", "/blocks.1/self_attn/Unsqueeze_3_output_0", "/blocks.1/self_attn/Concat_1_output_0", "/blocks.1/self_attn/Reshape_1_output_0", "/blocks.1/self_attn/Mul_2_output_0", "/blocks.1/self_attn/Shape_3_output_0", "Shape280", "Rank282", "BinaryOp284", "Unsqueeze285", "BinaryOp287", "Unsqueeze288", "StridedSlice291", "Squeeze292", "BinaryOp293", "BinaryOp294", "/blocks.1/self_attn/Gather_3_output_0", "/blocks.1/self_attn/Div_1_output_0", "/blocks.1/self_attn/Unsqueeze_9_output_0", "/blocks.1/self_attn/Slice_3_output_0", "/blocks.1/self_attn/Neg_1_output_0", "/blocks.1/self_attn/Unsqueeze_8_output_0", "/blocks.1/self_attn/Slice_2_output_0", "/blocks.1/self_attn/Concat_4_output_0", "/blocks.1/self_attn/Mul_3_output_0", "/blocks.1/self_attn/Add_1_output_0", "/blocks.1/self_attn/v_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_4_output_0", "/blocks.1/self_attn/Unsqueeze_5_output_0", "/blocks.1/self_attn/Concat_2_output_0", "/blocks.1/self_attn/Reshape_2_output_0", "/blocks.1/self_attn/fused_attn/FusedAttention_output_0", "/blocks.1/self_attn/o_proj/FakeLinear_output_0", "/blocks.1/Add_output_0", "/blocks.1/post_attention_layernorm/Mul_1_output_0", "/blocks.1/mlp/gate_proj/FakeLinear_output_0", "/blocks.1/mlp/act_fn/Mul_output_0", "/blocks.1/mlp/up_proj/FakeLinear_output_0", "/blocks.1/mlp/Mul_output_0", "/blocks.1/mlp/down_proj/FakeLinear_output_0", "/blocks.1/Add_1_output_0", "/blocks.2/Reshape_output_0", "/blocks.2/input_layernorm/Mul_1_output_0", "/blocks.2/self_attn/q_proj/FakeLinear_output_0", "/blocks.2/self_attn/Shape_output_0", "Shape340", "Rank342", "BinaryOp344", "Unsqueeze345", "BinaryOp347", "Unsqueeze348", "StridedSlice351", "Squeeze352", "BinaryOp354", "/blocks.2/self_attn/Gather_output_0", "/blocks.2/self_attn/Unsqueeze_output_0", "Unsqueeze362", "Unsqueeze365", "StridedSlice368", "Squeeze369", "BinaryOp370", "BinaryOp371", "/blocks.2/self_attn/Gather_1_output_0", "/blocks.2/self_attn/Unsqueeze_1_output_0", "/blocks.2/self_attn/Concat_output_0", "/blocks.2/self_attn/Reshape_output_0", "/blocks.2/self_attn/Mul_output_0", "/blocks.2/self_attn/Shape_2_output_0", "Shape378", "Rank380", "BinaryOp382", "Unsqueeze383", "BinaryOp385", "Unsqueeze386", "StridedSlice389", "Squeeze390", "BinaryOp391", "BinaryOp392", "/blocks.2/self_attn/Gather_2_output_0", "/blocks.2/self_attn/Div_output_0", "/blocks.2/self_attn/Unsqueeze_7_output_0", "/blocks.2/self_attn/Slice_1_output_0", "/blocks.2/self_attn/Neg_output_0", "/blocks.2/self_attn/Unsqueeze_6_output_0", "/blocks.2/self_attn/Slice_output_0", "/blocks.2/self_attn/Concat_3_output_0", "/blocks.2/self_attn/Mul_1_output_0", "/blocks.2/self_attn/Add_output_0", "/blocks.2/self_attn/k_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_2_output_0", "/blocks.2/self_attn/Unsqueeze_3_output_0", "/blocks.2/self_attn/Concat_1_output_0", "/blocks.2/self_attn/Reshape_1_output_0", "/blocks.2/self_attn/Mul_2_output_0", "/blocks.2/self_attn/Shape_3_output_0", "Shape411", "Rank413", "BinaryOp415", "Unsqueeze416", "BinaryOp418", "Unsqueeze419", "StridedSlice422", "Squeeze423", "BinaryOp424", "BinaryOp425", "/blocks.2/self_attn/Gather_3_output_0", "/blocks.2/self_attn/Div_1_output_0", "/blocks.2/self_attn/Unsqueeze_9_output_0", "/blocks.2/self_attn/Slice_3_output_0", "/blocks.2/self_attn/Neg_1_output_0", "/blocks.2/self_attn/Unsqueeze_8_output_0", "/blocks.2/self_attn/Slice_2_output_0", "/blocks.2/self_attn/Concat_4_output_0", "/blocks.2/self_attn/Mul_3_output_0", "/blocks.2/self_attn/Add_1_output_0", "/blocks.2/self_attn/v_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_4_output_0", "/blocks.2/self_attn/Unsqueeze_5_output_0", "/blocks.2/self_attn/Concat_2_output_0", "/blocks.2/self_attn/Reshape_2_output_0", "/blocks.2/self_attn/fused_attn/FusedAttention_output_0", "/blocks.2/self_attn/o_proj/FakeLinear_output_0", "/blocks.2/Add_output_0", "/blocks.2/post_attention_layernorm/Mul_1_output_0", "/blocks.2/mlp/gate_proj/FakeLinear_output_0", "/blocks.2/mlp/act_fn/Mul_output_0", "/blocks.2/mlp/up_proj/FakeLinear_output_0", "/blocks.2/mlp/Mul_output_0", "/blocks.2/mlp/down_proj/FakeLinear_output_0", "/blocks.2/Add_1_output_0", "/blocks.3/Reshape_output_0", "/blocks.3/input_layernorm/Mul_1_output_0", "/blocks.3/self_attn/q_proj/FakeLinear_output_0", "/blocks.3/self_attn/Shape_output_0", "Shape471", "Rank473", "BinaryOp475", "Unsqueeze476", "BinaryOp478", "Unsqueeze479", "StridedSlice482", "Squeeze483", "BinaryOp485", "/blocks.3/self_attn/Gather_output_0", "/blocks.3/self_attn/Unsqueeze_output_0", "Unsqueeze493", "Unsqueeze496", "StridedSlice499", "Squeeze500", "BinaryOp501", "BinaryOp502", "/blocks.3/self_attn/Gather_1_output_0", "/blocks.3/self_attn/Unsqueeze_1_output_0", "/blocks.3/self_attn/Concat_output_0", "/blocks.3/self_attn/Reshape_output_0", "/blocks.3/self_attn/Mul_output_0", "/blocks.3/self_attn/Shape_2_output_0", "Shape509", "Rank511", "BinaryOp513", "Unsqueeze514", "BinaryOp516", "Unsqueeze517", "StridedSlice520", "Squeeze521", "BinaryOp522", "BinaryOp523", "/blocks.3/self_attn/Gather_2_output_0", "/blocks.3/self_attn/Div_output_0", "/blocks.3/self_attn/Unsqueeze_7_output_0", "/blocks.3/self_attn/Slice_1_output_0", "/blocks.3/self_attn/Neg_output_0", "/blocks.3/self_attn/Unsqueeze_6_output_0", "/blocks.3/self_attn/Slice_output_0", "/blocks.3/self_attn/Concat_3_output_0", "/blocks.3/self_attn/Mul_1_output_0", "/blocks.3/self_attn/Add_output_0", "/blocks.3/self_attn/k_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_2_output_0", "/blocks.3/self_attn/Unsqueeze_3_output_0", "/blocks.3/self_attn/Concat_1_output_0", "/blocks.3/self_attn/Reshape_1_output_0", "/blocks.3/self_attn/Mul_2_output_0", "/blocks.3/self_attn/Shape_3_output_0", "Shape542", "Rank544", "BinaryOp546", "Unsqueeze547", "BinaryOp549", "Unsqueeze550", "StridedSlice553", "Squeeze554", "BinaryOp555", "BinaryOp556", "/blocks.3/self_attn/Gather_3_output_0", "/blocks.3/self_attn/Div_1_output_0", "/blocks.3/self_attn/Unsqueeze_9_output_0", "/blocks.3/self_attn/Slice_3_output_0", "/blocks.3/self_attn/Neg_1_output_0", "/blocks.3/self_attn/Unsqueeze_8_output_0", "/blocks.3/self_attn/Slice_2_output_0", "/blocks.3/self_attn/Concat_4_output_0", "/blocks.3/self_attn/Mul_3_output_0", "/blocks.3/self_attn/Add_1_output_0", "/blocks.3/self_attn/v_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_4_output_0", "/blocks.3/self_attn/Unsqueeze_5_output_0", "/blocks.3/self_attn/Concat_2_output_0", "/blocks.3/self_attn/Reshape_2_output_0", "/blocks.3/self_attn/fused_attn/FusedAttention_output_0", "/blocks.3/self_attn/o_proj/FakeLinear_output_0", "/blocks.3/Add_output_0", "/blocks.3/post_attention_layernorm/Mul_1_output_0", "/blocks.3/mlp/gate_proj/FakeLinear_output_0", "/blocks.3/mlp/act_fn/Mul_output_0", "/blocks.3/mlp/up_proj/FakeLinear_output_0", "/blocks.3/mlp/Mul_output_0", "/blocks.3/mlp/down_proj/FakeLinear_output_0", "/blocks.3/Add_1_output_0", "/blocks.4/Reshape_output_0", "/blocks.4/input_layernorm/Mul_1_output_0", "/blocks.4/self_attn/q_proj/FakeLinear_output_0", "/blocks.4/self_attn/Shape_output_0", "Shape602", "Rank604", "BinaryOp606", "Unsqueeze607", "BinaryOp609", "Unsqueeze610", "StridedSlice613", "Squeeze614", "BinaryOp616", "/blocks.4/self_attn/Gather_output_0", "/blocks.4/self_attn/Unsqueeze_output_0", "Unsqueeze624", "Unsqueeze627", "StridedSlice630", "Squeeze631", "BinaryOp632", "BinaryOp633", "/blocks.4/self_attn/Gather_1_output_0", "/blocks.4/self_attn/Unsqueeze_1_output_0", "/blocks.4/self_attn/Concat_output_0", "/blocks.4/self_attn/Reshape_output_0", "/blocks.4/self_attn/Mul_output_0", "/blocks.4/self_attn/Shape_2_output_0", "Shape640", "Rank642", "BinaryOp644", "Unsqueeze645", "BinaryOp647", "Unsqueeze648", "StridedSlice651", "Squeeze652", "BinaryOp653", "BinaryOp654", "/blocks.4/self_attn/Gather_2_output_0", "/blocks.4/self_attn/Div_output_0", "/blocks.4/self_attn/Unsqueeze_7_output_0", "/blocks.4/self_attn/Slice_1_output_0", "/blocks.4/self_attn/Neg_output_0", "/blocks.4/self_attn/Unsqueeze_6_output_0", "/blocks.4/self_attn/Slice_output_0", "/blocks.4/self_attn/Concat_3_output_0", "/blocks.4/self_attn/Mul_1_output_0", "/blocks.4/self_attn/Add_output_0", "/blocks.4/self_attn/k_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_2_output_0", "/blocks.4/self_attn/Unsqueeze_3_output_0", "/blocks.4/self_attn/Concat_1_output_0", "/blocks.4/self_attn/Reshape_1_output_0", "/blocks.4/self_attn/Mul_2_output_0", "/blocks.4/self_attn/Shape_3_output_0", "Shape673", "Rank675", "BinaryOp677", "Unsqueeze678", "BinaryOp680", "Unsqueeze681", "StridedSlice684", "Squeeze685", "BinaryOp686", "BinaryOp687", "/blocks.4/self_attn/Gather_3_output_0", "/blocks.4/self_attn/Div_1_output_0", "/blocks.4/self_attn/Unsqueeze_9_output_0", "/blocks.4/self_attn/Slice_3_output_0", "/blocks.4/self_attn/Neg_1_output_0", "/blocks.4/self_attn/Unsqueeze_8_output_0", "/blocks.4/self_attn/Slice_2_output_0", "/blocks.4/self_attn/Concat_4_output_0", "/blocks.4/self_attn/Mul_3_output_0", "/blocks.4/self_attn/Add_1_output_0", "/blocks.4/self_attn/v_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_4_output_0", "/blocks.4/self_attn/Unsqueeze_5_output_0", "/blocks.4/self_attn/Concat_2_output_0", "/blocks.4/self_attn/Reshape_2_output_0", "/blocks.4/self_attn/fused_attn/FusedAttention_output_0", "/blocks.4/self_attn/o_proj/FakeLinear_output_0", "/blocks.4/Add_output_0", "/blocks.4/post_attention_layernorm/Mul_1_output_0", "/blocks.4/mlp/gate_proj/FakeLinear_output_0", "/blocks.4/mlp/act_fn/Mul_output_0", "/blocks.4/mlp/up_proj/FakeLinear_output_0", "/blocks.4/mlp/Mul_output_0", "/blocks.4/mlp/down_proj/FakeLinear_output_0", "/blocks.4/Add_1_output_0", "/blocks.5/Reshape_output_0", "/blocks.5/input_layernorm/Mul_1_output_0", "/blocks.5/self_attn/q_proj/FakeLinear_output_0", "/blocks.5/self_attn/Shape_output_0", "Shape733", "Rank735", "BinaryOp737", "Unsqueeze738", "BinaryOp740", "Unsqueeze741", "StridedSlice744", "Squeeze745", "BinaryOp747", "/blocks.5/self_attn/Gather_output_0", "/blocks.5/self_attn/Unsqueeze_output_0", "Unsqueeze755", "Unsqueeze758", "StridedSlice761", "Squeeze762", "BinaryOp763", "BinaryOp764", "/blocks.5/self_attn/Gather_1_output_0", "/blocks.5/self_attn/Unsqueeze_1_output_0", "/blocks.5/self_attn/Concat_output_0", "/blocks.5/self_attn/Reshape_output_0", "/blocks.5/self_attn/Mul_output_0", "/blocks.5/self_attn/Shape_2_output_0", "Shape771", "Rank773", "BinaryOp775", "Unsqueeze776", "BinaryOp778", "Unsqueeze779", "StridedSlice782", "Squeeze783", "BinaryOp784", "BinaryOp785", "/blocks.5/self_attn/Gather_2_output_0", "/blocks.5/self_attn/Div_output_0", "/blocks.5/self_attn/Unsqueeze_7_output_0", "/blocks.5/self_attn/Slice_1_output_0", "/blocks.5/self_attn/Neg_output_0", "/blocks.5/self_attn/Unsqueeze_6_output_0", "/blocks.5/self_attn/Slice_output_0", "/blocks.5/self_attn/Concat_3_output_0", "/blocks.5/self_attn/Mul_1_output_0", "/blocks.5/self_attn/Add_output_0", "/blocks.5/self_attn/k_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_2_output_0", "/blocks.5/self_attn/Unsqueeze_3_output_0", "/blocks.5/self_attn/Concat_1_output_0", "/blocks.5/self_attn/Reshape_1_output_0", "/blocks.5/self_attn/Mul_2_output_0", "/blocks.5/self_attn/Shape_3_output_0", "Shape804", "Rank806", "BinaryOp808", "Unsqueeze809", "BinaryOp811", "Unsqueeze812", "StridedSlice815", "Squeeze816", "BinaryOp817", "BinaryOp818", "/blocks.5/self_attn/Gather_3_output_0", "/blocks.5/self_attn/Div_1_output_0", "/blocks.5/self_attn/Unsqueeze_9_output_0", "/blocks.5/self_attn/Slice_3_output_0", "/blocks.5/self_attn/Neg_1_output_0", "/blocks.5/self_attn/Unsqueeze_8_output_0", "/blocks.5/self_attn/Slice_2_output_0", "/blocks.5/self_attn/Concat_4_output_0", "/blocks.5/self_attn/Mul_3_output_0", "/blocks.5/self_attn/Add_1_output_0", "/blocks.5/self_attn/v_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_4_output_0", "/blocks.5/self_attn/Unsqueeze_5_output_0", "/blocks.5/self_attn/Concat_2_output_0", "/blocks.5/self_attn/Reshape_2_output_0", "/blocks.5/self_attn/fused_attn/FusedAttention_output_0", "/blocks.5/self_attn/o_proj/FakeLinear_output_0", "/blocks.5/Add_output_0", "/blocks.5/post_attention_layernorm/Mul_1_output_0", "/blocks.5/mlp/gate_proj/FakeLinear_output_0", "/blocks.5/mlp/act_fn/Mul_output_0", "/blocks.5/mlp/up_proj/FakeLinear_output_0", "/blocks.5/mlp/Mul_output_0", "/blocks.5/mlp/down_proj/FakeLinear_output_0", "/blocks.5/Add_1_output_0", "/blocks.6/Reshape_output_0", "/blocks.6/input_layernorm/Mul_1_output_0", "/blocks.6/self_attn/q_proj/FakeLinear_output_0", "/blocks.6/self_attn/Shape_output_0", "Shape864", "Rank866", "BinaryOp868", "Unsqueeze869", "BinaryOp871", "Unsqueeze872", "StridedSlice875", "Squeeze876", "BinaryOp878", "/blocks.6/self_attn/Gather_output_0", "/blocks.6/self_attn/Unsqueeze_output_0", "Unsqueeze886", "Unsqueeze889", "StridedSlice892", "Squeeze893", "BinaryOp894", "BinaryOp895", "/blocks.6/self_attn/Gather_1_output_0", "/blocks.6/self_attn/Unsqueeze_1_output_0", "/blocks.6/self_attn/Concat_output_0", "/blocks.6/self_attn/Reshape_output_0", "/blocks.6/self_attn/Mul_output_0", "/blocks.6/self_attn/Shape_2_output_0", "Shape902", "Rank904", "BinaryOp906", "Unsqueeze907", "BinaryOp909", "Unsqueeze910", "StridedSlice913", "Squeeze914", "BinaryOp915", "BinaryOp916", "/blocks.6/self_attn/Gather_2_output_0", "/blocks.6/self_attn/Div_output_0", "/blocks.6/self_attn/Unsqueeze_7_output_0", "/blocks.6/self_attn/Slice_1_output_0", "/blocks.6/self_attn/Neg_output_0", "/blocks.6/self_attn/Unsqueeze_6_output_0", "/blocks.6/self_attn/Slice_output_0", "/blocks.6/self_attn/Concat_3_output_0", "/blocks.6/self_attn/Mul_1_output_0", "/blocks.6/self_attn/Add_output_0", "/blocks.6/self_attn/k_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_2_output_0", "/blocks.6/self_attn/Unsqueeze_3_output_0", "/blocks.6/self_attn/Concat_1_output_0", "/blocks.6/self_attn/Reshape_1_output_0", "/blocks.6/self_attn/Mul_2_output_0", "/blocks.6/self_attn/Shape_3_output_0", "Shape935", "Rank937", "BinaryOp939", "Unsqueeze940", "BinaryOp942", "Unsqueeze943", "StridedSlice946", "Squeeze947", "BinaryOp948", "BinaryOp949", "/blocks.6/self_attn/Gather_3_output_0", "/blocks.6/self_attn/Div_1_output_0", "/blocks.6/self_attn/Unsqueeze_9_output_0", "/blocks.6/self_attn/Slice_3_output_0", "/blocks.6/self_attn/Neg_1_output_0", "/blocks.6/self_attn/Unsqueeze_8_output_0", "/blocks.6/self_attn/Slice_2_output_0", "/blocks.6/self_attn/Concat_4_output_0", "/blocks.6/self_attn/Mul_3_output_0", "/blocks.6/self_attn/Add_1_output_0", "/blocks.6/self_attn/v_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_4_output_0", "/blocks.6/self_attn/Unsqueeze_5_output_0", "/blocks.6/self_attn/Concat_2_output_0", "/blocks.6/self_attn/Reshape_2_output_0", "/blocks.6/self_attn/fused_attn/FusedAttention_output_0", "/blocks.6/self_attn/o_proj/FakeLinear_output_0", "/blocks.6/Add_output_0", "/blocks.6/post_attention_layernorm/Mul_1_output_0", "/blocks.6/mlp/gate_proj/FakeLinear_output_0", "/blocks.6/mlp/act_fn/Mul_output_0", "/blocks.6/mlp/up_proj/FakeLinear_output_0", "/blocks.6/mlp/Mul_output_0", "/blocks.6/mlp/down_proj/FakeLinear_output_0", "/blocks.6/Add_1_output_0", "/blocks.7/Reshape_output_0", "/blocks.7/input_layernorm/Mul_1_output_0", "/blocks.7/self_attn/q_proj/FakeLinear_output_0", "/blocks.7/self_attn/Shape_output_0", "Shape995", "Rank997", "BinaryOp999", "Unsqueeze1000", "BinaryOp1002", "Unsqueeze1003", "StridedSlice1006", "Squeeze1007", "BinaryOp1009", "/blocks.7/self_attn/Gather_output_0", "/blocks.7/self_attn/Unsqueeze_output_0", "Unsqueeze1017", "Unsqueeze1020", "StridedSlice1023", "Squeeze1024", "BinaryOp1025", "BinaryOp1026", "/blocks.7/self_attn/Gather_1_output_0", "/blocks.7/self_attn/Unsqueeze_1_output_0", "/blocks.7/self_attn/Concat_output_0", "/blocks.7/self_attn/Reshape_output_0", "/blocks.7/self_attn/Mul_output_0", "/blocks.7/self_attn/Shape_2_output_0", "Shape1033", "Rank1035", "BinaryOp1037", "Unsqueeze1038", "BinaryOp1040", "Unsqueeze1041", "StridedSlice1044", "Squeeze1045", "BinaryOp1046", "BinaryOp1047", "/blocks.7/self_attn/Gather_2_output_0", "/blocks.7/self_attn/Div_output_0", "/blocks.7/self_attn/Unsqueeze_7_output_0", "/blocks.7/self_attn/Slice_1_output_0", "/blocks.7/self_attn/Neg_output_0", "/blocks.7/self_attn/Unsqueeze_6_output_0", "/blocks.7/self_attn/Slice_output_0", "/blocks.7/self_attn/Concat_3_output_0", "/blocks.7/self_attn/Mul_1_output_0", "/blocks.7/self_attn/Add_output_0", "/blocks.7/self_attn/k_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_2_output_0", "/blocks.7/self_attn/Unsqueeze_3_output_0", "/blocks.7/self_attn/Concat_1_output_0", "/blocks.7/self_attn/Reshape_1_output_0", "/blocks.7/self_attn/Mul_2_output_0", "/blocks.7/self_attn/Shape_3_output_0", "Shape1066", "Rank1068", "BinaryOp1070", "Unsqueeze1071", "BinaryOp1073", "Unsqueeze1074", "StridedSlice1077", "Squeeze1078", "BinaryOp1079", "BinaryOp1080", "/blocks.7/self_attn/Gather_3_output_0", "/blocks.7/self_attn/Div_1_output_0", "/blocks.7/self_attn/Unsqueeze_9_output_0", "/blocks.7/self_attn/Slice_3_output_0", "/blocks.7/self_attn/Neg_1_output_0", "/blocks.7/self_attn/Unsqueeze_8_output_0", "/blocks.7/self_attn/Slice_2_output_0", "/blocks.7/self_attn/Concat_4_output_0", "/blocks.7/self_attn/Mul_3_output_0", "/blocks.7/self_attn/Add_1_output_0", "/blocks.7/self_attn/v_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_4_output_0", "/blocks.7/self_attn/Unsqueeze_5_output_0", "/blocks.7/self_attn/Concat_2_output_0", "/blocks.7/self_attn/Reshape_2_output_0", "/blocks.7/self_attn/fused_attn/FusedAttention_output_0", "/blocks.7/self_attn/o_proj/FakeLinear_output_0", "/blocks.7/Add_output_0", "/blocks.7/post_attention_layernorm/Mul_1_output_0", "/blocks.7/mlp/gate_proj/FakeLinear_output_0", "/blocks.7/mlp/act_fn/Mul_output_0", "/blocks.7/mlp/up_proj/FakeLinear_output_0", "/blocks.7/mlp/Mul_output_0", "/blocks.7/mlp/down_proj/FakeLinear_output_0", "/blocks.7/Add_1_output_0", "/blocks.8/Reshape_output_0", "/blocks.8/input_layernorm/Mul_1_output_0", "/blocks.8/self_attn/q_proj/FakeLinear_output_0", "/blocks.8/self_attn/Shape_output_0", "Shape1126", "Rank1128", "BinaryOp1130", "Unsqueeze1131", "BinaryOp1133", "Unsqueeze1134", "StridedSlice1137", "Squeeze1138", "BinaryOp1140", "/blocks.8/self_attn/Gather_output_0", "/blocks.8/self_attn/Unsqueeze_output_0", "Unsqueeze1148", "Unsqueeze1151", "StridedSlice1154", "Squeeze1155", "BinaryOp1156", "BinaryOp1157", "/blocks.8/self_attn/Gather_1_output_0", "/blocks.8/self_attn/Unsqueeze_1_output_0", "/blocks.8/self_attn/Concat_output_0", "/blocks.8/self_attn/Reshape_output_0", "/blocks.8/self_attn/Mul_output_0", "/blocks.8/self_attn/Shape_2_output_0", "Shape1164", "Rank1166", "BinaryOp1168", "Unsqueeze1169", "BinaryOp1171", "Unsqueeze1172", "StridedSlice1175", "Squeeze1176", "BinaryOp1177", "BinaryOp1178", "/blocks.8/self_attn/Gather_2_output_0", "/blocks.8/self_attn/Div_output_0", "/blocks.8/self_attn/Unsqueeze_7_output_0", "/blocks.8/self_attn/Slice_1_output_0", "/blocks.8/self_attn/Neg_output_0", "/blocks.8/self_attn/Unsqueeze_6_output_0", "/blocks.8/self_attn/Slice_output_0", "/blocks.8/self_attn/Concat_3_output_0", "/blocks.8/self_attn/Mul_1_output_0", "/blocks.8/self_attn/Add_output_0", "/blocks.8/self_attn/k_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_2_output_0", "/blocks.8/self_attn/Unsqueeze_3_output_0", "/blocks.8/self_attn/Concat_1_output_0", "/blocks.8/self_attn/Reshape_1_output_0", "/blocks.8/self_attn/Mul_2_output_0", "/blocks.8/self_attn/Shape_3_output_0", "Shape1197", "Rank1199", "BinaryOp1201", "Unsqueeze1202", "BinaryOp1204", "Unsqueeze1205", "StridedSlice1208", "Squeeze1209", "BinaryOp1210", "BinaryOp1211", "/blocks.8/self_attn/Gather_3_output_0", "/blocks.8/self_attn/Div_1_output_0", "/blocks.8/self_attn/Unsqueeze_9_output_0", "/blocks.8/self_attn/Slice_3_output_0", "/blocks.8/self_attn/Neg_1_output_0", "/blocks.8/self_attn/Unsqueeze_8_output_0", "/blocks.8/self_attn/Slice_2_output_0", "/blocks.8/self_attn/Concat_4_output_0", "/blocks.8/self_attn/Mul_3_output_0", "/blocks.8/self_attn/Add_1_output_0", "/blocks.8/self_attn/v_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_4_output_0", "/blocks.8/self_attn/Unsqueeze_5_output_0", "/blocks.8/self_attn/Concat_2_output_0", "/blocks.8/self_attn/Reshape_2_output_0", "/blocks.8/self_attn/fused_attn/FusedAttention_output_0", "/blocks.8/self_attn/o_proj/FakeLinear_output_0", "/blocks.8/Add_output_0", "/blocks.8/post_attention_layernorm/Mul_1_output_0", "/blocks.8/mlp/gate_proj/FakeLinear_output_0", "/blocks.8/mlp/act_fn/Mul_output_0", "/blocks.8/mlp/up_proj/FakeLinear_output_0", "/blocks.8/mlp/Mul_output_0", "/blocks.8/mlp/down_proj/FakeLinear_output_0", "/blocks.8/Add_1_output_0", "/blocks.9/Reshape_output_0", "/blocks.9/input_layernorm/Mul_1_output_0", "/blocks.9/self_attn/q_proj/FakeLinear_output_0", "/blocks.9/self_attn/Shape_output_0", "Shape1257", "Rank1259", "BinaryOp1261", "Unsqueeze1262", "BinaryOp1264", "Unsqueeze1265", "StridedSlice1268", "Squeeze1269", "BinaryOp1271", "/blocks.9/self_attn/Gather_output_0", "/blocks.9/self_attn/Unsqueeze_output_0", "Unsqueeze1279", "Unsqueeze1282", "StridedSlice1285", "Squeeze1286", "BinaryOp1287", "BinaryOp1288", "/blocks.9/self_attn/Gather_1_output_0", "/blocks.9/self_attn/Unsqueeze_1_output_0", "/blocks.9/self_attn/Concat_output_0", "/blocks.9/self_attn/Reshape_output_0", "/blocks.9/self_attn/Mul_output_0", "/blocks.9/self_attn/Shape_2_output_0", "Shape1295", "Rank1297", "BinaryOp1299", "Unsqueeze1300", "BinaryOp1302", "Unsqueeze1303", "StridedSlice1306", "Squeeze1307", "BinaryOp1308", "BinaryOp1309", "/blocks.9/self_attn/Gather_2_output_0", "/blocks.9/self_attn/Div_output_0", "/blocks.9/self_attn/Unsqueeze_7_output_0", "/blocks.9/self_attn/Slice_1_output_0", "/blocks.9/self_attn/Neg_output_0", "/blocks.9/self_attn/Unsqueeze_6_output_0", "/blocks.9/self_attn/Slice_output_0", "/blocks.9/self_attn/Concat_3_output_0", "/blocks.9/self_attn/Mul_1_output_0", "/blocks.9/self_attn/Add_output_0", "/blocks.9/self_attn/k_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_2_output_0", "/blocks.9/self_attn/Unsqueeze_3_output_0", "/blocks.9/self_attn/Concat_1_output_0", "/blocks.9/self_attn/Reshape_1_output_0", "/blocks.9/self_attn/Mul_2_output_0", "/blocks.9/self_attn/Shape_3_output_0", "Shape1328", "Rank1330", "BinaryOp1332", "Unsqueeze1333", "BinaryOp1335", "Unsqueeze1336", "StridedSlice1339", "Squeeze1340", "BinaryOp1341", "BinaryOp1342", "/blocks.9/self_attn/Gather_3_output_0", "/blocks.9/self_attn/Div_1_output_0", "/blocks.9/self_attn/Unsqueeze_9_output_0", "/blocks.9/self_attn/Slice_3_output_0", "/blocks.9/self_attn/Neg_1_output_0", "/blocks.9/self_attn/Unsqueeze_8_output_0", "/blocks.9/self_attn/Slice_2_output_0", "/blocks.9/self_attn/Concat_4_output_0", "/blocks.9/self_attn/Mul_3_output_0", "/blocks.9/self_attn/Add_1_output_0", "/blocks.9/self_attn/v_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_4_output_0", "/blocks.9/self_attn/Unsqueeze_5_output_0", "/blocks.9/self_attn/Concat_2_output_0", "/blocks.9/self_attn/Reshape_2_output_0", "/blocks.9/self_attn/fused_attn/FusedAttention_output_0", "/blocks.9/self_attn/o_proj/FakeLinear_output_0", "/blocks.9/Add_output_0", "/blocks.9/post_attention_layernorm/Mul_1_output_0", "/blocks.9/mlp/gate_proj/FakeLinear_output_0", "/blocks.9/mlp/act_fn/Mul_output_0", "/blocks.9/mlp/up_proj/FakeLinear_output_0", "/blocks.9/mlp/Mul_output_0", "/blocks.9/mlp/down_proj/FakeLinear_output_0", "/blocks.9/Add_1_output_0", "/blocks.10/Reshape_output_0", "/blocks.10/input_layernorm/Mul_1_output_0", "/blocks.10/self_attn/q_proj/FakeLinear_output_0", "/blocks.10/self_attn/Shape_output_0", "Shape1388", "Rank1390", "BinaryOp1392", "Unsqueeze1393", "BinaryOp1395", "Unsqueeze1396", "StridedSlice1399", "Squeeze1400", "BinaryOp1402", "/blocks.10/self_attn/Gather_output_0", "/blocks.10/self_attn/Unsqueeze_output_0", "Unsqueeze1410", "Unsqueeze1413", "StridedSlice1416", "Squeeze1417", "BinaryOp1418", "BinaryOp1419", "/blocks.10/self_attn/Gather_1_output_0", "/blocks.10/self_attn/Unsqueeze_1_output_0", "/blocks.10/self_attn/Concat_output_0", "/blocks.10/self_attn/Reshape_output_0", "/blocks.10/self_attn/Mul_output_0", "/blocks.10/self_attn/Shape_2_output_0", "Shape1426", "Rank1428", "BinaryOp1430", "Unsqueeze1431", "BinaryOp1433", "Unsqueeze1434", "StridedSlice1437", "Squeeze1438", "BinaryOp1439", "BinaryOp1440", "/blocks.10/self_attn/Gather_2_output_0", "/blocks.10/self_attn/Div_output_0", "/blocks.10/self_attn/Unsqueeze_7_output_0", "/blocks.10/self_attn/Slice_1_output_0", "/blocks.10/self_attn/Neg_output_0", "/blocks.10/self_attn/Unsqueeze_6_output_0", "/blocks.10/self_attn/Slice_output_0", "/blocks.10/self_attn/Concat_3_output_0", "/blocks.10/self_attn/Mul_1_output_0", "/blocks.10/self_attn/Add_output_0", "/blocks.10/self_attn/k_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_2_output_0", "/blocks.10/self_attn/Unsqueeze_3_output_0", "/blocks.10/self_attn/Concat_1_output_0", "/blocks.10/self_attn/Reshape_1_output_0", "/blocks.10/self_attn/Mul_2_output_0", "/blocks.10/self_attn/Shape_3_output_0", "Shape1459", "Rank1461", "BinaryOp1463", "Unsqueeze1464", "BinaryOp1466", "Unsqueeze1467", "StridedSlice1470", "Squeeze1471", "BinaryOp1472", "BinaryOp1473", "/blocks.10/self_attn/Gather_3_output_0", "/blocks.10/self_attn/Div_1_output_0", "/blocks.10/self_attn/Unsqueeze_9_output_0", "/blocks.10/self_attn/Slice_3_output_0", "/blocks.10/self_attn/Neg_1_output_0", "/blocks.10/self_attn/Unsqueeze_8_output_0", "/blocks.10/self_attn/Slice_2_output_0", "/blocks.10/self_attn/Concat_4_output_0", "/blocks.10/self_attn/Mul_3_output_0", "/blocks.10/self_attn/Add_1_output_0", "/blocks.10/self_attn/v_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_4_output_0", "/blocks.10/self_attn/Unsqueeze_5_output_0", "/blocks.10/self_attn/Concat_2_output_0", "/blocks.10/self_attn/Reshape_2_output_0", "/blocks.10/self_attn/fused_attn/FusedAttention_output_0", "/blocks.10/self_attn/o_proj/FakeLinear_output_0", "/blocks.10/Add_output_0", "/blocks.10/post_attention_layernorm/Mul_1_output_0", "/blocks.10/mlp/gate_proj/FakeLinear_output_0", "/blocks.10/mlp/act_fn/Mul_output_0", "/blocks.10/mlp/up_proj/FakeLinear_output_0", "/blocks.10/mlp/Mul_output_0", "/blocks.10/mlp/down_proj/FakeLinear_output_0", "/blocks.10/Add_1_output_0", "/blocks.11/Reshape_output_0", "/blocks.11/input_layernorm/Mul_1_output_0", "/blocks.11/self_attn/q_proj/FakeLinear_output_0", "/blocks.11/self_attn/Shape_output_0", "Shape1519", "Rank1521", "BinaryOp1523", "Unsqueeze1524", "BinaryOp1526", "Unsqueeze1527", "StridedSlice1530", "Squeeze1531", "BinaryOp1533", "/blocks.11/self_attn/Gather_output_0", "/blocks.11/self_attn/Unsqueeze_output_0", "Unsqueeze1541", "Unsqueeze1544", "StridedSlice1547", "Squeeze1548", "BinaryOp1549", "BinaryOp1550", "/blocks.11/self_attn/Gather_1_output_0", "/blocks.11/self_attn/Unsqueeze_1_output_0", "/blocks.11/self_attn/Concat_output_0", "/blocks.11/self_attn/Reshape_output_0", "/blocks.11/self_attn/Mul_output_0", "/blocks.11/self_attn/Shape_2_output_0", "Shape1557", "Rank1559", "BinaryOp1561", "Unsqueeze1562", "BinaryOp1564", "Unsqueeze1565", "StridedSlice1568", "Squeeze1569", "BinaryOp1570", "BinaryOp1571", "/blocks.11/self_attn/Gather_2_output_0", "/blocks.11/self_attn/Div_output_0", "/blocks.11/self_attn/Unsqueeze_7_output_0", "/blocks.11/self_attn/Slice_1_output_0", "/blocks.11/self_attn/Neg_output_0", "/blocks.11/self_attn/Unsqueeze_6_output_0", "/blocks.11/self_attn/Slice_output_0", "/blocks.11/self_attn/Concat_3_output_0", "/blocks.11/self_attn/Mul_1_output_0", "/blocks.11/self_attn/Add_output_0", "/blocks.11/self_attn/k_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_2_output_0", "/blocks.11/self_attn/Unsqueeze_3_output_0", "/blocks.11/self_attn/Concat_1_output_0", "/blocks.11/self_attn/Reshape_1_output_0", "/blocks.11/self_attn/Mul_2_output_0", "/blocks.11/self_attn/Shape_3_output_0", "Shape1590", "Rank1592", "BinaryOp1594", "Unsqueeze1595", "BinaryOp1597", "Unsqueeze1598", "StridedSlice1601", "Squeeze1602", "BinaryOp1603", "BinaryOp1604", "/blocks.11/self_attn/Gather_3_output_0", "/blocks.11/self_attn/Div_1_output_0", "/blocks.11/self_attn/Unsqueeze_9_output_0", "/blocks.11/self_attn/Slice_3_output_0", "/blocks.11/self_attn/Neg_1_output_0", "/blocks.11/self_attn/Unsqueeze_8_output_0", "/blocks.11/self_attn/Slice_2_output_0", "/blocks.11/self_attn/Concat_4_output_0", "/blocks.11/self_attn/Mul_3_output_0", "/blocks.11/self_attn/Add_1_output_0", "/blocks.11/self_attn/v_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_4_output_0", "/blocks.11/self_attn/Unsqueeze_5_output_0", "/blocks.11/self_attn/Concat_2_output_0", "/blocks.11/self_attn/Reshape_2_output_0", "/blocks.11/self_attn/fused_attn/FusedAttention_output_0", "/blocks.11/self_attn/o_proj/FakeLinear_output_0", "/blocks.11/Add_output_0", "/blocks.11/post_attention_layernorm/Mul_1_output_0", "/blocks.11/mlp/gate_proj/FakeLinear_output_0", "/blocks.11/mlp/act_fn/Mul_output_0", "/blocks.11/mlp/up_proj/FakeLinear_output_0", "/blocks.11/mlp/Mul_output_0", "/blocks.11/mlp/down_proj/FakeLinear_output_0", "/blocks.11/Add_1_output_0", "/blocks.12/Reshape_output_0", "/blocks.12/input_layernorm/Mul_1_output_0", "/blocks.12/self_attn/q_proj/FakeLinear_output_0", "/blocks.12/self_attn/Shape_output_0", "Shape1650", "Rank1652", "BinaryOp1654", "Unsqueeze1655", "BinaryOp1657", "Unsqueeze1658", "StridedSlice1661", "Squeeze1662", "BinaryOp1664", "/blocks.12/self_attn/Gather_output_0", "/blocks.12/self_attn/Unsqueeze_output_0", "Unsqueeze1672", "Unsqueeze1675", "StridedSlice1678", "Squeeze1679", "BinaryOp1680", "BinaryOp1681", "/blocks.12/self_attn/Gather_1_output_0", "/blocks.12/self_attn/Unsqueeze_1_output_0", "/blocks.12/self_attn/Concat_output_0", "/blocks.12/self_attn/Reshape_output_0", "/blocks.12/self_attn/Mul_output_0", "/blocks.12/self_attn/Shape_2_output_0", "Shape1688", "Rank1690", "BinaryOp1692", "Unsqueeze1693", "BinaryOp1695", "Unsqueeze1696", "StridedSlice1699", "Squeeze1700", "BinaryOp1701", "BinaryOp1702", "/blocks.12/self_attn/Gather_2_output_0", "/blocks.12/self_attn/Div_output_0", "/blocks.12/self_attn/Unsqueeze_7_output_0", "/blocks.12/self_attn/Slice_1_output_0", "/blocks.12/self_attn/Neg_output_0", "/blocks.12/self_attn/Unsqueeze_6_output_0", "/blocks.12/self_attn/Slice_output_0", "/blocks.12/self_attn/Concat_3_output_0", "/blocks.12/self_attn/Mul_1_output_0", "/blocks.12/self_attn/Add_output_0", "/blocks.12/self_attn/k_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_2_output_0", "/blocks.12/self_attn/Unsqueeze_3_output_0", "/blocks.12/self_attn/Concat_1_output_0", "/blocks.12/self_attn/Reshape_1_output_0", "/blocks.12/self_attn/Mul_2_output_0", "/blocks.12/self_attn/Shape_3_output_0", "Shape1721", "Rank1723", "BinaryOp1725", "Unsqueeze1726", "BinaryOp1728", "Unsqueeze1729", "StridedSlice1732", "Squeeze1733", "BinaryOp1734", "BinaryOp1735", "/blocks.12/self_attn/Gather_3_output_0", "/blocks.12/self_attn/Div_1_output_0", "/blocks.12/self_attn/Unsqueeze_9_output_0", "/blocks.12/self_attn/Slice_3_output_0", "/blocks.12/self_attn/Neg_1_output_0", "/blocks.12/self_attn/Unsqueeze_8_output_0", "/blocks.12/self_attn/Slice_2_output_0", "/blocks.12/self_attn/Concat_4_output_0", "/blocks.12/self_attn/Mul_3_output_0", "/blocks.12/self_attn/Add_1_output_0", "/blocks.12/self_attn/v_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_4_output_0", "/blocks.12/self_attn/Unsqueeze_5_output_0", "/blocks.12/self_attn/Concat_2_output_0", "/blocks.12/self_attn/Reshape_2_output_0", "/blocks.12/self_attn/fused_attn/FusedAttention_output_0", "/blocks.12/self_attn/o_proj/FakeLinear_output_0", "/blocks.12/Add_output_0", "/blocks.12/post_attention_layernorm/Mul_1_output_0", "/blocks.12/mlp/gate_proj/FakeLinear_output_0", "/blocks.12/mlp/act_fn/Mul_output_0", "/blocks.12/mlp/up_proj/FakeLinear_output_0", "/blocks.12/mlp/Mul_output_0", "/blocks.12/mlp/down_proj/FakeLinear_output_0", "/blocks.12/Add_1_output_0", "/blocks.13/Reshape_output_0", "/blocks.13/input_layernorm/Mul_1_output_0", "/blocks.13/self_attn/q_proj/FakeLinear_output_0", "/blocks.13/self_attn/Shape_output_0", "Shape1781", "Rank1783", "BinaryOp1785", "Unsqueeze1786", "BinaryOp1788", "Unsqueeze1789", "StridedSlice1792", "Squeeze1793", "BinaryOp1795", "/blocks.13/self_attn/Gather_output_0", "/blocks.13/self_attn/Unsqueeze_output_0", "Unsqueeze1803", "Unsqueeze1806", "StridedSlice1809", "Squeeze1810", "BinaryOp1811", "BinaryOp1812", "/blocks.13/self_attn/Gather_1_output_0", "/blocks.13/self_attn/Unsqueeze_1_output_0", "/blocks.13/self_attn/Concat_output_0", "/blocks.13/self_attn/Reshape_output_0", "/blocks.13/self_attn/Mul_output_0", "/blocks.13/self_attn/Shape_2_output_0", "Shape1819", "Rank1821", "BinaryOp1823", "Unsqueeze1824", "BinaryOp1826", "Unsqueeze1827", "StridedSlice1830", "Squeeze1831", "BinaryOp1832", "BinaryOp1833", "/blocks.13/self_attn/Gather_2_output_0", "/blocks.13/self_attn/Div_output_0", "/blocks.13/self_attn/Unsqueeze_7_output_0", "/blocks.13/self_attn/Slice_1_output_0", "/blocks.13/self_attn/Neg_output_0", "/blocks.13/self_attn/Unsqueeze_6_output_0", "/blocks.13/self_attn/Slice_output_0", "/blocks.13/self_attn/Concat_3_output_0", "/blocks.13/self_attn/Mul_1_output_0", "/blocks.13/self_attn/Add_output_0", "/blocks.13/self_attn/k_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_2_output_0", "/blocks.13/self_attn/Unsqueeze_3_output_0", "/blocks.13/self_attn/Concat_1_output_0", "/blocks.13/self_attn/Reshape_1_output_0", "/blocks.13/self_attn/Mul_2_output_0", "/blocks.13/self_attn/Shape_3_output_0", "Shape1852", "Rank1854", "BinaryOp1856", "Unsqueeze1857", "BinaryOp1859", "Unsqueeze1860", "StridedSlice1863", "Squeeze1864", "BinaryOp1865", "BinaryOp1866", "/blocks.13/self_attn/Gather_3_output_0", "/blocks.13/self_attn/Div_1_output_0", "/blocks.13/self_attn/Unsqueeze_9_output_0", "/blocks.13/self_attn/Slice_3_output_0", "/blocks.13/self_attn/Neg_1_output_0", "/blocks.13/self_attn/Unsqueeze_8_output_0", "/blocks.13/self_attn/Slice_2_output_0", "/blocks.13/self_attn/Concat_4_output_0", "/blocks.13/self_attn/Mul_3_output_0", "/blocks.13/self_attn/Add_1_output_0", "/blocks.13/self_attn/v_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_4_output_0", "/blocks.13/self_attn/Unsqueeze_5_output_0", "/blocks.13/self_attn/Concat_2_output_0", "/blocks.13/self_attn/Reshape_2_output_0", "/blocks.13/self_attn/fused_attn/FusedAttention_output_0", "/blocks.13/self_attn/o_proj/FakeLinear_output_0", "/blocks.13/Add_output_0", "/blocks.13/post_attention_layernorm/Mul_1_output_0", "/blocks.13/mlp/gate_proj/FakeLinear_output_0", "/blocks.13/mlp/act_fn/Mul_output_0", "/blocks.13/mlp/up_proj/FakeLinear_output_0", "/blocks.13/mlp/Mul_output_0", "/blocks.13/mlp/down_proj/FakeLinear_output_0", "/blocks.13/Add_1_output_0", "/blocks.14/Reshape_output_0", "/blocks.14/input_layernorm/Mul_1_output_0", "/blocks.14/self_attn/q_proj/FakeLinear_output_0", "/blocks.14/self_attn/Shape_output_0", "Shape1912", "Rank1914", "BinaryOp1916", "Unsqueeze1917", "BinaryOp1919", "Unsqueeze1920", "StridedSlice1923", "Squeeze1924", "BinaryOp1926", "/blocks.14/self_attn/Gather_output_0", "/blocks.14/self_attn/Unsqueeze_output_0", "Unsqueeze1934", "Unsqueeze1937", "StridedSlice1940", "Squeeze1941", "BinaryOp1942", "BinaryOp1943", "/blocks.14/self_attn/Gather_1_output_0", "/blocks.14/self_attn/Unsqueeze_1_output_0", "/blocks.14/self_attn/Concat_output_0", "/blocks.14/self_attn/Reshape_output_0", "/blocks.14/self_attn/Mul_output_0", "/blocks.14/self_attn/Shape_2_output_0", "Shape1950", "Rank1952", "BinaryOp1954", "Unsqueeze1955", "BinaryOp1957", "Unsqueeze1958", "StridedSlice1961", "Squeeze1962", "BinaryOp1963", "BinaryOp1964", "/blocks.14/self_attn/Gather_2_output_0", "/blocks.14/self_attn/Div_output_0", "/blocks.14/self_attn/Unsqueeze_7_output_0", "/blocks.14/self_attn/Slice_1_output_0", "/blocks.14/self_attn/Neg_output_0", "/blocks.14/self_attn/Unsqueeze_6_output_0", "/blocks.14/self_attn/Slice_output_0", "/blocks.14/self_attn/Concat_3_output_0", "/blocks.14/self_attn/Mul_1_output_0", "/blocks.14/self_attn/Add_output_0", "/blocks.14/self_attn/k_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_2_output_0", "/blocks.14/self_attn/Unsqueeze_3_output_0", "/blocks.14/self_attn/Concat_1_output_0", "/blocks.14/self_attn/Reshape_1_output_0", "/blocks.14/self_attn/Mul_2_output_0", "/blocks.14/self_attn/Shape_3_output_0", "Shape1983", "Rank1985", "BinaryOp1987", "Unsqueeze1988", "BinaryOp1990", "Unsqueeze1991", "StridedSlice1994", "Squeeze1995", "BinaryOp1996", "BinaryOp1997", "/blocks.14/self_attn/Gather_3_output_0", "/blocks.14/self_attn/Div_1_output_0", "/blocks.14/self_attn/Unsqueeze_9_output_0", "/blocks.14/self_attn/Slice_3_output_0", "/blocks.14/self_attn/Neg_1_output_0", "/blocks.14/self_attn/Unsqueeze_8_output_0", "/blocks.14/self_attn/Slice_2_output_0", "/blocks.14/self_attn/Concat_4_output_0", "/blocks.14/self_attn/Mul_3_output_0", "/blocks.14/self_attn/Add_1_output_0", "/blocks.14/self_attn/v_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_4_output_0", "/blocks.14/self_attn/Unsqueeze_5_output_0", "/blocks.14/self_attn/Concat_2_output_0", "/blocks.14/self_attn/Reshape_2_output_0", "/blocks.14/self_attn/fused_attn/FusedAttention_output_0", "/blocks.14/self_attn/o_proj/FakeLinear_output_0", "/blocks.14/Add_output_0", "/blocks.14/post_attention_layernorm/Mul_1_output_0", "/blocks.14/mlp/gate_proj/FakeLinear_output_0", "/blocks.14/mlp/act_fn/Mul_output_0", "/blocks.14/mlp/up_proj/FakeLinear_output_0", "/blocks.14/mlp/Mul_output_0", "/blocks.14/mlp/down_proj/FakeLinear_output_0", "/blocks.14/Add_1_output_0", "/blocks.15/Reshape_output_0", "/blocks.15/input_layernorm/Mul_1_output_0", "/blocks.15/self_attn/q_proj/FakeLinear_output_0", "/blocks.15/self_attn/Shape_output_0", "Shape2043", "Rank2045", "BinaryOp2047", "Unsqueeze2048", "BinaryOp2050", "Unsqueeze2051", "StridedSlice2054", "Squeeze2055", "BinaryOp2057", "/blocks.15/self_attn/Gather_output_0", "/blocks.15/self_attn/Unsqueeze_output_0", "Unsqueeze2065", "Unsqueeze2068", "StridedSlice2071", "Squeeze2072", "BinaryOp2073", "BinaryOp2074", "/blocks.15/self_attn/Gather_1_output_0", "/blocks.15/self_attn/Unsqueeze_1_output_0", "/blocks.15/self_attn/Concat_output_0", "/blocks.15/self_attn/Reshape_output_0", "/blocks.15/self_attn/Mul_output_0", "/blocks.15/self_attn/Shape_2_output_0", "Shape2081", "Rank2083", "BinaryOp2085", "Unsqueeze2086", "BinaryOp2088", "Unsqueeze2089", "StridedSlice2092", "Squeeze2093", "BinaryOp2094", "BinaryOp2095", "/blocks.15/self_attn/Gather_2_output_0", "/blocks.15/self_attn/Div_output_0", "/blocks.15/self_attn/Unsqueeze_7_output_0", "/blocks.15/self_attn/Slice_1_output_0", "/blocks.15/self_attn/Neg_output_0", "/blocks.15/self_attn/Unsqueeze_6_output_0", "/blocks.15/self_attn/Slice_output_0", "/blocks.15/self_attn/Concat_3_output_0", "/blocks.15/self_attn/Mul_1_output_0", "/blocks.15/self_attn/Add_output_0", "/blocks.15/self_attn/k_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_2_output_0", "/blocks.15/self_attn/Unsqueeze_3_output_0", "/blocks.15/self_attn/Concat_1_output_0", "/blocks.15/self_attn/Reshape_1_output_0", "/blocks.15/self_attn/Mul_2_output_0", "/blocks.15/self_attn/Shape_3_output_0", "Shape2114", "Rank2116", "BinaryOp2118", "Unsqueeze2119", "BinaryOp2121", "Unsqueeze2122", "StridedSlice2125", "Squeeze2126", "BinaryOp2127", "BinaryOp2128", "/blocks.15/self_attn/Gather_3_output_0", "/blocks.15/self_attn/Div_1_output_0", "/blocks.15/self_attn/Unsqueeze_9_output_0", "/blocks.15/self_attn/Slice_3_output_0", "/blocks.15/self_attn/Neg_1_output_0", "/blocks.15/self_attn/Unsqueeze_8_output_0", "/blocks.15/self_attn/Slice_2_output_0", "/blocks.15/self_attn/Concat_4_output_0", "/blocks.15/self_attn/Mul_3_output_0", "/blocks.15/self_attn/Add_1_output_0", "/blocks.15/self_attn/v_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_4_output_0", "/blocks.15/self_attn/Unsqueeze_5_output_0", "/blocks.15/self_attn/Concat_2_output_0", "/blocks.15/self_attn/Reshape_2_output_0", "/blocks.15/self_attn/fused_attn/FusedAttention_output_0", "/blocks.15/self_attn/o_proj/FakeLinear_output_0", "/blocks.15/Add_output_0", "/blocks.15/post_attention_layernorm/Mul_1_output_0", "/blocks.15/mlp/gate_proj/FakeLinear_output_0", "/blocks.15/mlp/act_fn/Mul_output_0", "/blocks.15/mlp/up_proj/FakeLinear_output_0", "/blocks.15/mlp/Mul_output_0", "/blocks.15/mlp/down_proj/FakeLinear_output_0", "/blocks.15/Add_1_output_0", "/blocks.16/Reshape_output_0", "/blocks.16/input_layernorm/Mul_1_output_0", "/blocks.16/self_attn/q_proj/FakeLinear_output_0", "/blocks.16/self_attn/Shape_output_0", "Shape2174", "Rank2176", "BinaryOp2178", "Unsqueeze2179", "BinaryOp2181", "Unsqueeze2182", "StridedSlice2185", "Squeeze2186", "BinaryOp2188", "/blocks.16/self_attn/Gather_output_0", "/blocks.16/self_attn/Unsqueeze_output_0", "Unsqueeze2196", "Unsqueeze2199", "StridedSlice2202", "Squeeze2203", "BinaryOp2204", "BinaryOp2205", "/blocks.16/self_attn/Gather_1_output_0", "/blocks.16/self_attn/Unsqueeze_1_output_0", "/blocks.16/self_attn/Concat_output_0", "/blocks.16/self_attn/Reshape_output_0", "/blocks.16/self_attn/Mul_output_0", "/blocks.16/self_attn/Shape_2_output_0", "Shape2212", "Rank2214", "BinaryOp2216", "Unsqueeze2217", "BinaryOp2219", "Unsqueeze2220", "StridedSlice2223", "Squeeze2224", "BinaryOp2225", "BinaryOp2226", "/blocks.16/self_attn/Gather_2_output_0", "/blocks.16/self_attn/Div_output_0", "/blocks.16/self_attn/Unsqueeze_7_output_0", "/blocks.16/self_attn/Slice_1_output_0", "/blocks.16/self_attn/Neg_output_0", "/blocks.16/self_attn/Unsqueeze_6_output_0", "/blocks.16/self_attn/Slice_output_0", "/blocks.16/self_attn/Concat_3_output_0", "/blocks.16/self_attn/Mul_1_output_0", "/blocks.16/self_attn/Add_output_0", "/blocks.16/self_attn/k_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_2_output_0", "/blocks.16/self_attn/Unsqueeze_3_output_0", "/blocks.16/self_attn/Concat_1_output_0", "/blocks.16/self_attn/Reshape_1_output_0", "/blocks.16/self_attn/Mul_2_output_0", "/blocks.16/self_attn/Shape_3_output_0", "Shape2245", "Rank2247", "BinaryOp2249", "Unsqueeze2250", "BinaryOp2252", "Unsqueeze2253", "StridedSlice2256", "Squeeze2257", "BinaryOp2258", "BinaryOp2259", "/blocks.16/self_attn/Gather_3_output_0", "/blocks.16/self_attn/Div_1_output_0", "/blocks.16/self_attn/Unsqueeze_9_output_0", "/blocks.16/self_attn/Slice_3_output_0", "/blocks.16/self_attn/Neg_1_output_0", "/blocks.16/self_attn/Unsqueeze_8_output_0", "/blocks.16/self_attn/Slice_2_output_0", "/blocks.16/self_attn/Concat_4_output_0", "/blocks.16/self_attn/Mul_3_output_0", "/blocks.16/self_attn/Add_1_output_0", "/blocks.16/self_attn/v_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_4_output_0", "/blocks.16/self_attn/Unsqueeze_5_output_0", "/blocks.16/self_attn/Concat_2_output_0", "/blocks.16/self_attn/Reshape_2_output_0", "/blocks.16/self_attn/fused_attn/FusedAttention_output_0", "/blocks.16/self_attn/o_proj/FakeLinear_output_0", "/blocks.16/Add_output_0", "/blocks.16/post_attention_layernorm/Mul_1_output_0", "/blocks.16/mlp/gate_proj/FakeLinear_output_0", "/blocks.16/mlp/act_fn/Mul_output_0", "/blocks.16/mlp/up_proj/FakeLinear_output_0", "/blocks.16/mlp/Mul_output_0", "/blocks.16/mlp/down_proj/FakeLinear_output_0", "/blocks.16/Add_1_output_0", "/blocks.17/Reshape_output_0", "/blocks.17/input_layernorm/Mul_1_output_0", "/blocks.17/self_attn/q_proj/FakeLinear_output_0", "/blocks.17/self_attn/Shape_output_0", "Shape2305", "Rank2307", "BinaryOp2309", "Unsqueeze2310", "BinaryOp2312", "Unsqueeze2313", "StridedSlice2316", "Squeeze2317", "BinaryOp2319", "/blocks.17/self_attn/Gather_output_0", "/blocks.17/self_attn/Unsqueeze_output_0", "Unsqueeze2327", "Unsqueeze2330", "StridedSlice2333", "Squeeze2334", "BinaryOp2335", "BinaryOp2336", "/blocks.17/self_attn/Gather_1_output_0", "/blocks.17/self_attn/Unsqueeze_1_output_0", "/blocks.17/self_attn/Concat_output_0", "/blocks.17/self_attn/Reshape_output_0", "/blocks.17/self_attn/Mul_output_0", "/blocks.17/self_attn/Shape_2_output_0", "Shape2343", "Rank2345", "BinaryOp2347", "Unsqueeze2348", "BinaryOp2350", "Unsqueeze2351", "StridedSlice2354", "Squeeze2355", "BinaryOp2356", "BinaryOp2357", "/blocks.17/self_attn/Gather_2_output_0", "/blocks.17/self_attn/Div_output_0", "/blocks.17/self_attn/Unsqueeze_7_output_0", "/blocks.17/self_attn/Slice_1_output_0", "/blocks.17/self_attn/Neg_output_0", "/blocks.17/self_attn/Unsqueeze_6_output_0", "/blocks.17/self_attn/Slice_output_0", "/blocks.17/self_attn/Concat_3_output_0", "/blocks.17/self_attn/Mul_1_output_0", "/blocks.17/self_attn/Add_output_0", "/blocks.17/self_attn/k_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_2_output_0", "/blocks.17/self_attn/Unsqueeze_3_output_0", "/blocks.17/self_attn/Concat_1_output_0", "/blocks.17/self_attn/Reshape_1_output_0", "/blocks.17/self_attn/Mul_2_output_0", "/blocks.17/self_attn/Shape_3_output_0", "Shape2376", "Rank2378", "BinaryOp2380", "Unsqueeze2381", "BinaryOp2383", "Unsqueeze2384", "StridedSlice2387", "Squeeze2388", "BinaryOp2389", "BinaryOp2390", "/blocks.17/self_attn/Gather_3_output_0", "/blocks.17/self_attn/Div_1_output_0", "/blocks.17/self_attn/Unsqueeze_9_output_0", "/blocks.17/self_attn/Slice_3_output_0", "/blocks.17/self_attn/Neg_1_output_0", "/blocks.17/self_attn/Unsqueeze_8_output_0", "/blocks.17/self_attn/Slice_2_output_0", "/blocks.17/self_attn/Concat_4_output_0", "/blocks.17/self_attn/Mul_3_output_0", "/blocks.17/self_attn/Add_1_output_0", "/blocks.17/self_attn/v_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_4_output_0", "/blocks.17/self_attn/Unsqueeze_5_output_0", "/blocks.17/self_attn/Concat_2_output_0", "/blocks.17/self_attn/Reshape_2_output_0", "/blocks.17/self_attn/fused_attn/FusedAttention_output_0", "/blocks.17/self_attn/o_proj/FakeLinear_output_0", "/blocks.17/Add_output_0", "/blocks.17/post_attention_layernorm/Mul_1_output_0", "/blocks.17/mlp/gate_proj/FakeLinear_output_0", "/blocks.17/mlp/act_fn/Mul_output_0", "/blocks.17/mlp/up_proj/FakeLinear_output_0", "/blocks.17/mlp/Mul_output_0", "/blocks.17/mlp/down_proj/FakeLinear_output_0", "/blocks.17/Add_1_output_0", "/blocks.18/Reshape_output_0", "/blocks.18/input_layernorm/Mul_1_output_0", "/blocks.18/self_attn/q_proj/FakeLinear_output_0", "/blocks.18/self_attn/Shape_output_0", "Shape2436", "Rank2438", "BinaryOp2440", "Unsqueeze2441", "BinaryOp2443", "Unsqueeze2444", "StridedSlice2447", "Squeeze2448", "BinaryOp2450", "/blocks.18/self_attn/Gather_output_0", "/blocks.18/self_attn/Unsqueeze_output_0", "Unsqueeze2458", "Unsqueeze2461", "StridedSlice2464", "Squeeze2465", "BinaryOp2466", "BinaryOp2467", "/blocks.18/self_attn/Gather_1_output_0", "/blocks.18/self_attn/Unsqueeze_1_output_0", "/blocks.18/self_attn/Concat_output_0", "/blocks.18/self_attn/Reshape_output_0", "/blocks.18/self_attn/Mul_output_0", "/blocks.18/self_attn/Shape_2_output_0", "Shape2474", "Rank2476", "BinaryOp2478", "Unsqueeze2479", "BinaryOp2481", "Unsqueeze2482", "StridedSlice2485", "Squeeze2486", "BinaryOp2487", "BinaryOp2488", "/blocks.18/self_attn/Gather_2_output_0", "/blocks.18/self_attn/Div_output_0", "/blocks.18/self_attn/Unsqueeze_7_output_0", "/blocks.18/self_attn/Slice_1_output_0", "/blocks.18/self_attn/Neg_output_0", "/blocks.18/self_attn/Unsqueeze_6_output_0", "/blocks.18/self_attn/Slice_output_0", "/blocks.18/self_attn/Concat_3_output_0", "/blocks.18/self_attn/Mul_1_output_0", "/blocks.18/self_attn/Add_output_0", "/blocks.18/self_attn/k_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_2_output_0", "/blocks.18/self_attn/Unsqueeze_3_output_0", "/blocks.18/self_attn/Concat_1_output_0", "/blocks.18/self_attn/Reshape_1_output_0", "/blocks.18/self_attn/Mul_2_output_0", "/blocks.18/self_attn/Shape_3_output_0", "Shape2507", "Rank2509", "BinaryOp2511", "Unsqueeze2512", "BinaryOp2514", "Unsqueeze2515", "StridedSlice2518", "Squeeze2519", "BinaryOp2520", "BinaryOp2521", "/blocks.18/self_attn/Gather_3_output_0", "/blocks.18/self_attn/Div_1_output_0", "/blocks.18/self_attn/Unsqueeze_9_output_0", "/blocks.18/self_attn/Slice_3_output_0", "/blocks.18/self_attn/Neg_1_output_0", "/blocks.18/self_attn/Unsqueeze_8_output_0", "/blocks.18/self_attn/Slice_2_output_0", "/blocks.18/self_attn/Concat_4_output_0", "/blocks.18/self_attn/Mul_3_output_0", "/blocks.18/self_attn/Add_1_output_0", "/blocks.18/self_attn/v_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_4_output_0", "/blocks.18/self_attn/Unsqueeze_5_output_0", "/blocks.18/self_attn/Concat_2_output_0", "/blocks.18/self_attn/Reshape_2_output_0", "/blocks.18/self_attn/fused_attn/FusedAttention_output_0", "/blocks.18/self_attn/o_proj/FakeLinear_output_0", "/blocks.18/Add_output_0", "/blocks.18/post_attention_layernorm/Mul_1_output_0", "/blocks.18/mlp/gate_proj/FakeLinear_output_0", "/blocks.18/mlp/act_fn/Mul_output_0", "/blocks.18/mlp/up_proj/FakeLinear_output_0", "/blocks.18/mlp/Mul_output_0", "/blocks.18/mlp/down_proj/FakeLinear_output_0", "/blocks.18/Add_1_output_0", "/blocks.19/Reshape_output_0", "/blocks.19/input_layernorm/Mul_1_output_0", "/blocks.19/self_attn/q_proj/FakeLinear_output_0", "/blocks.19/self_attn/Shape_output_0", "Shape2567", "Rank2569", "BinaryOp2571", "Unsqueeze2572", "BinaryOp2574", "Unsqueeze2575", "StridedSlice2578", "Squeeze2579", "BinaryOp2581", "/blocks.19/self_attn/Gather_output_0", "/blocks.19/self_attn/Unsqueeze_output_0", "Unsqueeze2589", "Unsqueeze2592", "StridedSlice2595", "Squeeze2596", "BinaryOp2597", "BinaryOp2598", "/blocks.19/self_attn/Gather_1_output_0", "/blocks.19/self_attn/Unsqueeze_1_output_0", "/blocks.19/self_attn/Concat_output_0", "/blocks.19/self_attn/Reshape_output_0", "/blocks.19/self_attn/Mul_output_0", "/blocks.19/self_attn/Shape_2_output_0", "Shape2605", "Rank2607", "BinaryOp2609", "Unsqueeze2610", "BinaryOp2612", "Unsqueeze2613", "StridedSlice2616", "Squeeze2617", "BinaryOp2618", "BinaryOp2619", "/blocks.19/self_attn/Gather_2_output_0", "/blocks.19/self_attn/Div_output_0", "/blocks.19/self_attn/Unsqueeze_7_output_0", "/blocks.19/self_attn/Slice_1_output_0", "/blocks.19/self_attn/Neg_output_0", "/blocks.19/self_attn/Unsqueeze_6_output_0", "/blocks.19/self_attn/Slice_output_0", "/blocks.19/self_attn/Concat_3_output_0", "/blocks.19/self_attn/Mul_1_output_0", "/blocks.19/self_attn/Add_output_0", "/blocks.19/self_attn/k_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_2_output_0", "/blocks.19/self_attn/Unsqueeze_3_output_0", "/blocks.19/self_attn/Concat_1_output_0", "/blocks.19/self_attn/Reshape_1_output_0", "/blocks.19/self_attn/Mul_2_output_0", "/blocks.19/self_attn/Shape_3_output_0", "Shape2638", "Rank2640", "BinaryOp2642", "Unsqueeze2643", "BinaryOp2645", "Unsqueeze2646", "StridedSlice2649", "Squeeze2650", "BinaryOp2651", "BinaryOp2652", "/blocks.19/self_attn/Gather_3_output_0", "/blocks.19/self_attn/Div_1_output_0", "/blocks.19/self_attn/Unsqueeze_9_output_0", "/blocks.19/self_attn/Slice_3_output_0", "/blocks.19/self_attn/Neg_1_output_0", "/blocks.19/self_attn/Unsqueeze_8_output_0", "/blocks.19/self_attn/Slice_2_output_0", "/blocks.19/self_attn/Concat_4_output_0", "/blocks.19/self_attn/Mul_3_output_0", "/blocks.19/self_attn/Add_1_output_0", "/blocks.19/self_attn/v_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_4_output_0", "/blocks.19/self_attn/Unsqueeze_5_output_0", "/blocks.19/self_attn/Concat_2_output_0", "/blocks.19/self_attn/Reshape_2_output_0", "/blocks.19/self_attn/fused_attn/FusedAttention_output_0", "/blocks.19/self_attn/o_proj/FakeLinear_output_0", "/blocks.19/Add_output_0", "/blocks.19/post_attention_layernorm/Mul_1_output_0", "/blocks.19/mlp/gate_proj/FakeLinear_output_0", "/blocks.19/mlp/act_fn/Mul_output_0", "/blocks.19/mlp/up_proj/FakeLinear_output_0", "/blocks.19/mlp/Mul_output_0", "/blocks.19/mlp/down_proj/FakeLinear_output_0", "/blocks.19/Add_1_output_0", "/blocks.20/Reshape_output_0", "/blocks.20/input_layernorm/Mul_1_output_0", "/blocks.20/self_attn/q_proj/FakeLinear_output_0", "/blocks.20/self_attn/Shape_output_0", "Shape2698", "Rank2700", "BinaryOp2702", "Unsqueeze2703", "BinaryOp2705", "Unsqueeze2706", "StridedSlice2709", "Squeeze2710", "BinaryOp2712", "/blocks.20/self_attn/Gather_output_0", "/blocks.20/self_attn/Unsqueeze_output_0", "Unsqueeze2720", "Unsqueeze2723", "StridedSlice2726", "Squeeze2727", "BinaryOp2728", "BinaryOp2729", "/blocks.20/self_attn/Gather_1_output_0", "/blocks.20/self_attn/Unsqueeze_1_output_0", "/blocks.20/self_attn/Concat_output_0", "/blocks.20/self_attn/Reshape_output_0", "/blocks.20/self_attn/Mul_output_0", "/blocks.20/self_attn/Shape_2_output_0", "Shape2736", "Rank2738", "BinaryOp2740", "Unsqueeze2741", "BinaryOp2743", "Unsqueeze2744", "StridedSlice2747", "Squeeze2748", "BinaryOp2749", "BinaryOp2750", "/blocks.20/self_attn/Gather_2_output_0", "/blocks.20/self_attn/Div_output_0", "/blocks.20/self_attn/Unsqueeze_7_output_0", "/blocks.20/self_attn/Slice_1_output_0", "/blocks.20/self_attn/Neg_output_0", "/blocks.20/self_attn/Unsqueeze_6_output_0", "/blocks.20/self_attn/Slice_output_0", "/blocks.20/self_attn/Concat_3_output_0", "/blocks.20/self_attn/Mul_1_output_0", "/blocks.20/self_attn/Add_output_0", "/blocks.20/self_attn/k_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_2_output_0", "/blocks.20/self_attn/Unsqueeze_3_output_0", "/blocks.20/self_attn/Concat_1_output_0", "/blocks.20/self_attn/Reshape_1_output_0", "/blocks.20/self_attn/Mul_2_output_0", "/blocks.20/self_attn/Shape_3_output_0", "Shape2769", "Rank2771", "BinaryOp2773", "Unsqueeze2774", "BinaryOp2776", "Unsqueeze2777", "StridedSlice2780", "Squeeze2781", "BinaryOp2782", "BinaryOp2783", "/blocks.20/self_attn/Gather_3_output_0", "/blocks.20/self_attn/Div_1_output_0", "/blocks.20/self_attn/Unsqueeze_9_output_0", "/blocks.20/self_attn/Slice_3_output_0", "/blocks.20/self_attn/Neg_1_output_0", "/blocks.20/self_attn/Unsqueeze_8_output_0", "/blocks.20/self_attn/Slice_2_output_0", "/blocks.20/self_attn/Concat_4_output_0", "/blocks.20/self_attn/Mul_3_output_0", "/blocks.20/self_attn/Add_1_output_0", "/blocks.20/self_attn/v_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_4_output_0", "/blocks.20/self_attn/Unsqueeze_5_output_0", "/blocks.20/self_attn/Concat_2_output_0", "/blocks.20/self_attn/Reshape_2_output_0", "/blocks.20/self_attn/fused_attn/FusedAttention_output_0", "/blocks.20/self_attn/o_proj/FakeLinear_output_0", "/blocks.20/Add_output_0", "/blocks.20/post_attention_layernorm/Mul_1_output_0", "/blocks.20/mlp/gate_proj/FakeLinear_output_0", "/blocks.20/mlp/act_fn/Mul_output_0", "/blocks.20/mlp/up_proj/FakeLinear_output_0", "/blocks.20/mlp/Mul_output_0", "/blocks.20/mlp/down_proj/FakeLinear_output_0", "/blocks.20/Add_1_output_0", "/blocks.21/Reshape_output_0", "/blocks.21/input_layernorm/Mul_1_output_0", "/blocks.21/self_attn/q_proj/FakeLinear_output_0", "/blocks.21/self_attn/Shape_output_0", "Shape2829", "Rank2831", "BinaryOp2833", "Unsqueeze2834", "BinaryOp2836", "Unsqueeze2837", "StridedSlice2840", "Squeeze2841", "BinaryOp2843", "/blocks.21/self_attn/Gather_output_0", "/blocks.21/self_attn/Unsqueeze_output_0", "Unsqueeze2851", "Unsqueeze2854", "StridedSlice2857", "Squeeze2858", "BinaryOp2859", "BinaryOp2860", "/blocks.21/self_attn/Gather_1_output_0", "/blocks.21/self_attn/Unsqueeze_1_output_0", "/blocks.21/self_attn/Concat_output_0", "/blocks.21/self_attn/Reshape_output_0", "/blocks.21/self_attn/Mul_output_0", "/blocks.21/self_attn/Shape_2_output_0", "Shape2867", "Rank2869", "BinaryOp2871", "Unsqueeze2872", "BinaryOp2874", "Unsqueeze2875", "StridedSlice2878", "Squeeze2879", "BinaryOp2880", "BinaryOp2881", "/blocks.21/self_attn/Gather_2_output_0", "/blocks.21/self_attn/Div_output_0", "/blocks.21/self_attn/Unsqueeze_7_output_0", "/blocks.21/self_attn/Slice_1_output_0", "/blocks.21/self_attn/Neg_output_0", "/blocks.21/self_attn/Unsqueeze_6_output_0", "/blocks.21/self_attn/Slice_output_0", "/blocks.21/self_attn/Concat_3_output_0", "/blocks.21/self_attn/Mul_1_output_0", "/blocks.21/self_attn/Add_output_0", "/blocks.21/self_attn/k_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_2_output_0", "/blocks.21/self_attn/Unsqueeze_3_output_0", "/blocks.21/self_attn/Concat_1_output_0", "/blocks.21/self_attn/Reshape_1_output_0", "/blocks.21/self_attn/Mul_2_output_0", "/blocks.21/self_attn/Shape_3_output_0", "Shape2900", "Rank2902", "BinaryOp2904", "Unsqueeze2905", "BinaryOp2907", "Unsqueeze2908", "StridedSlice2911", "Squeeze2912", "BinaryOp2913", "BinaryOp2914", "/blocks.21/self_attn/Gather_3_output_0", "/blocks.21/self_attn/Div_1_output_0", "/blocks.21/self_attn/Unsqueeze_9_output_0", "/blocks.21/self_attn/Slice_3_output_0", "/blocks.21/self_attn/Neg_1_output_0", "/blocks.21/self_attn/Unsqueeze_8_output_0", "/blocks.21/self_attn/Slice_2_output_0", "/blocks.21/self_attn/Concat_4_output_0", "/blocks.21/self_attn/Mul_3_output_0", "/blocks.21/self_attn/Add_1_output_0", "/blocks.21/self_attn/v_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_4_output_0", "/blocks.21/self_attn/Unsqueeze_5_output_0", "/blocks.21/self_attn/Concat_2_output_0", "/blocks.21/self_attn/Reshape_2_output_0", "/blocks.21/self_attn/fused_attn/FusedAttention_output_0", "/blocks.21/self_attn/o_proj/FakeLinear_output_0", "/blocks.21/Add_output_0", "/blocks.21/post_attention_layernorm/Mul_1_output_0", "/blocks.21/mlp/gate_proj/FakeLinear_output_0", "/blocks.21/mlp/act_fn/Mul_output_0", "/blocks.21/mlp/up_proj/FakeLinear_output_0", "/blocks.21/mlp/Mul_output_0", "/blocks.21/mlp/down_proj/FakeLinear_output_0", "/blocks.21/Add_1_output_0", "/blocks.22/Reshape_output_0", "/blocks.22/input_layernorm/Mul_1_output_0", "/blocks.22/self_attn/q_proj/FakeLinear_output_0", "/blocks.22/self_attn/Shape_output_0", "Shape2960", "Rank2962", "BinaryOp2964", "Unsqueeze2965", "BinaryOp2967", "Unsqueeze2968", "StridedSlice2971", "Squeeze2972", "BinaryOp2974", "/blocks.22/self_attn/Gather_output_0", "/blocks.22/self_attn/Unsqueeze_output_0", "Unsqueeze2982", "Unsqueeze2985", "StridedSlice2988", "Squeeze2989", "BinaryOp2990", "BinaryOp2991", "/blocks.22/self_attn/Gather_1_output_0", "/blocks.22/self_attn/Unsqueeze_1_output_0", "/blocks.22/self_attn/Concat_output_0", "/blocks.22/self_attn/Reshape_output_0", "/blocks.22/self_attn/Mul_output_0", "/blocks.22/self_attn/Shape_2_output_0", "Shape2998", "Rank3000", "BinaryOp3002", "Unsqueeze3003", "BinaryOp3005", "Unsqueeze3006", "StridedSlice3009", "Squeeze3010", "BinaryOp3011", "BinaryOp3012", "/blocks.22/self_attn/Gather_2_output_0", "/blocks.22/self_attn/Div_output_0", "/blocks.22/self_attn/Unsqueeze_7_output_0", "/blocks.22/self_attn/Slice_1_output_0", "/blocks.22/self_attn/Neg_output_0", "/blocks.22/self_attn/Unsqueeze_6_output_0", "/blocks.22/self_attn/Slice_output_0", "/blocks.22/self_attn/Concat_3_output_0", "/blocks.22/self_attn/Mul_1_output_0", "/blocks.22/self_attn/Add_output_0", "/blocks.22/self_attn/k_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_2_output_0", "/blocks.22/self_attn/Unsqueeze_3_output_0", "/blocks.22/self_attn/Concat_1_output_0", "/blocks.22/self_attn/Reshape_1_output_0", "/blocks.22/self_attn/Mul_2_output_0", "/blocks.22/self_attn/Shape_3_output_0", "Shape3031", "Rank3033", "BinaryOp3035", "Unsqueeze3036", "BinaryOp3038", "Unsqueeze3039", "StridedSlice3042", "Squeeze3043", "BinaryOp3044", "BinaryOp3045", "/blocks.22/self_attn/Gather_3_output_0", "/blocks.22/self_attn/Div_1_output_0", "/blocks.22/self_attn/Unsqueeze_9_output_0", "/blocks.22/self_attn/Slice_3_output_0", "/blocks.22/self_attn/Neg_1_output_0", "/blocks.22/self_attn/Unsqueeze_8_output_0", "/blocks.22/self_attn/Slice_2_output_0", "/blocks.22/self_attn/Concat_4_output_0", "/blocks.22/self_attn/Mul_3_output_0", "/blocks.22/self_attn/Add_1_output_0", "/blocks.22/self_attn/v_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_4_output_0", "/blocks.22/self_attn/Unsqueeze_5_output_0", "/blocks.22/self_attn/Concat_2_output_0", "/blocks.22/self_attn/Reshape_2_output_0", "/blocks.22/self_attn/fused_attn/FusedAttention_output_0", "/blocks.22/self_attn/o_proj/FakeLinear_output_0", "/blocks.22/Add_output_0", "/blocks.22/post_attention_layernorm/Mul_1_output_0", "/blocks.22/mlp/gate_proj/FakeLinear_output_0", "/blocks.22/mlp/act_fn/Mul_output_0", "/blocks.22/mlp/up_proj/FakeLinear_output_0", "/blocks.22/mlp/Mul_output_0", "/blocks.22/mlp/down_proj/FakeLinear_output_0", "/blocks.22/Add_1_output_0", "/blocks.23/Reshape_output_0", "/blocks.23/input_layernorm/Mul_1_output_0", "/blocks.23/self_attn/q_proj/FakeLinear_output_0", "/blocks.23/self_attn/Shape_output_0", "Shape3091", "Rank3093", "BinaryOp3095", "Unsqueeze3096", "BinaryOp3098", "Unsqueeze3099", "StridedSlice3102", "Squeeze3103", "BinaryOp3105", "/blocks.23/self_attn/Gather_output_0", "/blocks.23/self_attn/Unsqueeze_output_0", "Unsqueeze3113", "Unsqueeze3116", "StridedSlice3119", "Squeeze3120", "BinaryOp3121", "BinaryOp3122", "/blocks.23/self_attn/Gather_1_output_0", "/blocks.23/self_attn/Unsqueeze_1_output_0", "/blocks.23/self_attn/Concat_output_0", "/blocks.23/self_attn/Reshape_output_0", "/blocks.23/self_attn/Mul_output_0", "/blocks.23/self_attn/Shape_2_output_0", "Shape3129", "Rank3131", "BinaryOp3133", "Unsqueeze3134", "BinaryOp3136", "Unsqueeze3137", "StridedSlice3140", "Squeeze3141", "BinaryOp3142", "BinaryOp3143", "/blocks.23/self_attn/Gather_2_output_0", "/blocks.23/self_attn/Div_output_0", "/blocks.23/self_attn/Unsqueeze_7_output_0", "/blocks.23/self_attn/Slice_1_output_0", "/blocks.23/self_attn/Neg_output_0", "/blocks.23/self_attn/Unsqueeze_6_output_0", "/blocks.23/self_attn/Slice_output_0", "/blocks.23/self_attn/Concat_3_output_0", "/blocks.23/self_attn/Mul_1_output_0", "/blocks.23/self_attn/Add_output_0", "/blocks.23/self_attn/k_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_2_output_0", "/blocks.23/self_attn/Unsqueeze_3_output_0", "/blocks.23/self_attn/Concat_1_output_0", "/blocks.23/self_attn/Reshape_1_output_0", "/blocks.23/self_attn/Mul_2_output_0", "/blocks.23/self_attn/Shape_3_output_0", "Shape3162", "Rank3164", "BinaryOp3166", "Unsqueeze3167", "BinaryOp3169", "Unsqueeze3170", "StridedSlice3173", "Squeeze3174", "BinaryOp3175", "BinaryOp3176", "/blocks.23/self_attn/Gather_3_output_0", "/blocks.23/self_attn/Div_1_output_0", "/blocks.23/self_attn/Unsqueeze_9_output_0", "/blocks.23/self_attn/Slice_3_output_0", "/blocks.23/self_attn/Neg_1_output_0", "/blocks.23/self_attn/Unsqueeze_8_output_0", "/blocks.23/self_attn/Slice_2_output_0", "/blocks.23/self_attn/Concat_4_output_0", "/blocks.23/self_attn/Mul_3_output_0", "/blocks.23/self_attn/Add_1_output_0", "/blocks.23/self_attn/v_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_4_output_0", "/blocks.23/self_attn/Unsqueeze_5_output_0", "/blocks.23/self_attn/Concat_2_output_0", "/blocks.23/self_attn/Reshape_2_output_0", "/blocks.23/self_attn/fused_attn/FusedAttention_output_0", "/blocks.23/self_attn/o_proj/FakeLinear_output_0", "/blocks.23/Add_output_0", "/blocks.23/post_attention_layernorm/Mul_1_output_0", "/blocks.23/mlp/gate_proj/FakeLinear_output_0", "/blocks.23/mlp/act_fn/Mul_output_0", "/blocks.23/mlp/up_proj/FakeLinear_output_0", "/blocks.23/mlp/Mul_output_0", "/blocks.23/mlp/down_proj/FakeLinear_output_0", "/blocks.23/Add_1_output_0", "/blocks.24/Reshape_output_0", "/blocks.24/input_layernorm/Mul_1_output_0", "/blocks.24/self_attn/q_proj/FakeLinear_output_0", "/blocks.24/self_attn/Shape_output_0", "Shape3222", "Rank3224", "BinaryOp3226", "Unsqueeze3227", "BinaryOp3229", "Unsqueeze3230", "StridedSlice3233", "Squeeze3234", "BinaryOp3236", "/blocks.24/self_attn/Gather_output_0", "/blocks.24/self_attn/Unsqueeze_output_0", "Unsqueeze3244", "Unsqueeze3247", "StridedSlice3250", "Squeeze3251", "BinaryOp3252", "BinaryOp3253", "/blocks.24/self_attn/Gather_1_output_0", "/blocks.24/self_attn/Unsqueeze_1_output_0", "/blocks.24/self_attn/Concat_output_0", "/blocks.24/self_attn/Reshape_output_0", "/blocks.24/self_attn/Mul_output_0", "/blocks.24/self_attn/Shape_2_output_0", "Shape3260", "Rank3262", "BinaryOp3264", "Unsqueeze3265", "BinaryOp3267", "Unsqueeze3268", "StridedSlice3271", "Squeeze3272", "BinaryOp3273", "BinaryOp3274", "/blocks.24/self_attn/Gather_2_output_0", "/blocks.24/self_attn/Div_output_0", "/blocks.24/self_attn/Unsqueeze_7_output_0", "/blocks.24/self_attn/Slice_1_output_0", "/blocks.24/self_attn/Neg_output_0", "/blocks.24/self_attn/Unsqueeze_6_output_0", "/blocks.24/self_attn/Slice_output_0", "/blocks.24/self_attn/Concat_3_output_0", "/blocks.24/self_attn/Mul_1_output_0", "/blocks.24/self_attn/Add_output_0", "/blocks.24/self_attn/k_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_2_output_0", "/blocks.24/self_attn/Unsqueeze_3_output_0", "/blocks.24/self_attn/Concat_1_output_0", "/blocks.24/self_attn/Reshape_1_output_0", "/blocks.24/self_attn/Mul_2_output_0", "/blocks.24/self_attn/Shape_3_output_0", "Shape3293", "Rank3295", "BinaryOp3297", "Unsqueeze3298", "BinaryOp3300", "Unsqueeze3301", "StridedSlice3304", "Squeeze3305", "BinaryOp3306", "BinaryOp3307", "/blocks.24/self_attn/Gather_3_output_0", "/blocks.24/self_attn/Div_1_output_0", "/blocks.24/self_attn/Unsqueeze_9_output_0", "/blocks.24/self_attn/Slice_3_output_0", "/blocks.24/self_attn/Neg_1_output_0", "/blocks.24/self_attn/Unsqueeze_8_output_0", "/blocks.24/self_attn/Slice_2_output_0", "/blocks.24/self_attn/Concat_4_output_0", "/blocks.24/self_attn/Mul_3_output_0", "/blocks.24/self_attn/Add_1_output_0", "/blocks.24/self_attn/v_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_4_output_0", "/blocks.24/self_attn/Unsqueeze_5_output_0", "/blocks.24/self_attn/Concat_2_output_0", "/blocks.24/self_attn/Reshape_2_output_0", "/blocks.24/self_attn/fused_attn/FusedAttention_output_0", "/blocks.24/self_attn/o_proj/FakeLinear_output_0", "/blocks.24/Add_output_0", "/blocks.24/post_attention_layernorm/Mul_1_output_0", "/blocks.24/mlp/gate_proj/FakeLinear_output_0", "/blocks.24/mlp/act_fn/Mul_output_0", "/blocks.24/mlp/up_proj/FakeLinear_output_0", "/blocks.24/mlp/Mul_output_0", "/blocks.24/mlp/down_proj/FakeLinear_output_0", "/blocks.24/Add_1_output_0", "/blocks.25/Reshape_output_0", "/blocks.25/input_layernorm/Mul_1_output_0", "/blocks.25/self_attn/q_proj/FakeLinear_output_0", "/blocks.25/self_attn/Shape_output_0", "Shape3353", "Rank3355", "BinaryOp3357", "Unsqueeze3358", "BinaryOp3360", "Unsqueeze3361", "StridedSlice3364", "Squeeze3365", "BinaryOp3367", "/blocks.25/self_attn/Gather_output_0", "/blocks.25/self_attn/Unsqueeze_output_0", "Unsqueeze3375", "Unsqueeze3378", "StridedSlice3381", "Squeeze3382", "BinaryOp3383", "BinaryOp3384", "/blocks.25/self_attn/Gather_1_output_0", "/blocks.25/self_attn/Unsqueeze_1_output_0", "/blocks.25/self_attn/Concat_output_0", "/blocks.25/self_attn/Reshape_output_0", "/blocks.25/self_attn/Mul_output_0", "/blocks.25/self_attn/Shape_2_output_0", "Shape3391", "Rank3393", "BinaryOp3395", "Unsqueeze3396", "BinaryOp3398", "Unsqueeze3399", "StridedSlice3402", "Squeeze3403", "BinaryOp3404", "BinaryOp3405", "/blocks.25/self_attn/Gather_2_output_0", "/blocks.25/self_attn/Div_output_0", "/blocks.25/self_attn/Unsqueeze_7_output_0", "/blocks.25/self_attn/Slice_1_output_0", "/blocks.25/self_attn/Neg_output_0", "/blocks.25/self_attn/Unsqueeze_6_output_0", "/blocks.25/self_attn/Slice_output_0", "/blocks.25/self_attn/Concat_3_output_0", "/blocks.25/self_attn/Mul_1_output_0", "/blocks.25/self_attn/Add_output_0", "/blocks.25/self_attn/k_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_2_output_0", "/blocks.25/self_attn/Unsqueeze_3_output_0", "/blocks.25/self_attn/Concat_1_output_0", "/blocks.25/self_attn/Reshape_1_output_0", "/blocks.25/self_attn/Mul_2_output_0", "/blocks.25/self_attn/Shape_3_output_0", "Shape3424", "Rank3426", "BinaryOp3428", "Unsqueeze3429", "BinaryOp3431", "Unsqueeze3432", "StridedSlice3435", "Squeeze3436", "BinaryOp3437", "BinaryOp3438", "/blocks.25/self_attn/Gather_3_output_0", "/blocks.25/self_attn/Div_1_output_0", "/blocks.25/self_attn/Unsqueeze_9_output_0", "/blocks.25/self_attn/Slice_3_output_0", "/blocks.25/self_attn/Neg_1_output_0", "/blocks.25/self_attn/Unsqueeze_8_output_0", "/blocks.25/self_attn/Slice_2_output_0", "/blocks.25/self_attn/Concat_4_output_0", "/blocks.25/self_attn/Mul_3_output_0", "/blocks.25/self_attn/Add_1_output_0", "/blocks.25/self_attn/v_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_4_output_0", "/blocks.25/self_attn/Unsqueeze_5_output_0", "/blocks.25/self_attn/Concat_2_output_0", "/blocks.25/self_attn/Reshape_2_output_0", "/blocks.25/self_attn/fused_attn/FusedAttention_output_0", "/blocks.25/self_attn/o_proj/FakeLinear_output_0", "/blocks.25/Add_output_0", "/blocks.25/post_attention_layernorm/Mul_1_output_0", "/blocks.25/mlp/gate_proj/FakeLinear_output_0", "/blocks.25/mlp/act_fn/Mul_output_0", "/blocks.25/mlp/up_proj/FakeLinear_output_0", "/blocks.25/mlp/Mul_output_0", "/blocks.25/mlp/down_proj/FakeLinear_output_0", "/blocks.25/Add_1_output_0", "/blocks.26/Reshape_output_0", "/blocks.26/input_layernorm/Mul_1_output_0", "/blocks.26/self_attn/q_proj/FakeLinear_output_0", "/blocks.26/self_attn/Shape_output_0", "Shape3484", "Rank3486", "BinaryOp3488", "Unsqueeze3489", "BinaryOp3491", "Unsqueeze3492", "StridedSlice3495", "Squeeze3496", "BinaryOp3498", "/blocks.26/self_attn/Gather_output_0", "/blocks.26/self_attn/Unsqueeze_output_0", "Unsqueeze3506", "Unsqueeze3509", "StridedSlice3512", "Squeeze3513", "BinaryOp3514", "BinaryOp3515", "/blocks.26/self_attn/Gather_1_output_0", "/blocks.26/self_attn/Unsqueeze_1_output_0", "/blocks.26/self_attn/Concat_output_0", "/blocks.26/self_attn/Reshape_output_0", "/blocks.26/self_attn/Mul_output_0", "/blocks.26/self_attn/Shape_2_output_0", "Shape3522", "Rank3524", "BinaryOp3526", "Unsqueeze3527", "BinaryOp3529", "Unsqueeze3530", "StridedSlice3533", "Squeeze3534", "BinaryOp3535", "BinaryOp3536", "/blocks.26/self_attn/Gather_2_output_0", "/blocks.26/self_attn/Div_output_0", "/blocks.26/self_attn/Unsqueeze_7_output_0", "/blocks.26/self_attn/Slice_1_output_0", "/blocks.26/self_attn/Neg_output_0", "/blocks.26/self_attn/Unsqueeze_6_output_0", "/blocks.26/self_attn/Slice_output_0", "/blocks.26/self_attn/Concat_3_output_0", "/blocks.26/self_attn/Mul_1_output_0", "/blocks.26/self_attn/Add_output_0", "/blocks.26/self_attn/k_proj/FakeLinear_output_0", "/blocks.26/self_attn/Unsqueeze_2_output_0", "/blocks.26/self_attn/Unsqueeze_3_output_0", "/blocks.26/self_attn/Concat_1_output_0", "/blocks.26/self_attn/Reshape_1_output_0", "/blocks.26/self_attn/Mul_2_output_0", "/blocks.26/self_attn/Shape_3_output_0", "Shape3555", "Rank3557", "BinaryOp3559", "Unsqueeze3560", "BinaryOp3562", "Unsqueeze3563", "StridedSlice3566", "Squeeze3567", "BinaryOp3568", "BinaryOp3569", "/blocks.26/self_attn/Gather_3_output_0", "/blocks.26/self_attn/Div_1_output_0", "/blocks.26/self_attn/Unsqueeze_9_output_0", "/blocks.26/self_attn/Slice_3_output_0", "/blocks.26/self_attn/Neg_1_output_0", "/blocks.26/self_attn/Unsqueeze_8_output_0", "/blocks.26/self_attn/Slice_2_output_0", "/blocks.26/self_attn/Concat_4_output_0", "/blocks.26/self_attn/Mul_3_output_0", "/blocks.26/self_attn/Add_1_output_0", "/blocks.26/self_attn/v_proj/FakeLinear_output_0", "/blocks.26/self_attn/Unsqueeze_4_output_0", "/blocks.26/self_attn/Unsqueeze_5_output_0", "/blocks.26/self_attn/Concat_2_output_0", "/blocks.26/self_attn/Reshape_2_output_0", "/blocks.26/self_attn/fused_attn/FusedAttention_output_0", "/blocks.26/self_attn/o_proj/FakeLinear_output_0", "/blocks.26/Add_output_0", "/blocks.26/post_attention_layernorm/Mul_1_output_0", "/blocks.26/mlp/gate_proj/FakeLinear_output_0", "/blocks.26/mlp/act_fn/Mul_output_0", "/blocks.26/mlp/up_proj/FakeLinear_output_0", "/blocks.26/mlp/Mul_output_0", "/blocks.26/mlp/down_proj/FakeLinear_output_0", "/blocks.26/Add_1_output_0", "/blocks.27/Reshape_output_0", "/blocks.27/input_layernorm/Mul_1_output_0", "/blocks.27/self_attn/q_proj/FakeLinear_output_0", "/blocks.27/self_attn/Shape_output_0", "Shape3615", "Rank3617", "BinaryOp3619", "Unsqueeze3620", "BinaryOp3622", "Unsqueeze3623", "StridedSlice3626", "Squeeze3627", "BinaryOp3629", "/blocks.27/self_attn/Gather_output_0", "/blocks.27/self_attn/Unsqueeze_output_0", "Unsqueeze3637", "Unsqueeze3640", "StridedSlice3643", "Squeeze3644", "BinaryOp3645", "BinaryOp3646", "/blocks.27/self_attn/Gather_1_output_0", "/blocks.27/self_attn/Unsqueeze_1_output_0", "/blocks.27/self_attn/Concat_output_0", "/blocks.27/self_attn/Reshape_output_0", "/blocks.27/self_attn/Mul_output_0", "/blocks.27/self_attn/Shape_2_output_0", "Shape3653", "Rank3655", "BinaryOp3657", "Unsqueeze3658", "BinaryOp3660", "Unsqueeze3661", "StridedSlice3664", "Squeeze3665", "BinaryOp3666", "BinaryOp3667", "/blocks.27/self_attn/Gather_2_output_0", "/blocks.27/self_attn/Div_output_0", "/blocks.27/self_attn/Unsqueeze_7_output_0", "/blocks.27/self_attn/Slice_1_output_0", "/blocks.27/self_attn/Neg_output_0", "/blocks.27/self_attn/Unsqueeze_6_output_0", "/blocks.27/self_attn/Slice_output_0", "/blocks.27/self_attn/Concat_3_output_0", "/blocks.27/self_attn/Mul_1_output_0", "/blocks.27/self_attn/Add_output_0", "/blocks.27/self_attn/k_proj/FakeLinear_output_0", "/blocks.27/self_attn/Unsqueeze_2_output_0", "/blocks.27/self_attn/Unsqueeze_3_output_0", "/blocks.27/self_attn/Concat_1_output_0", "/blocks.27/self_attn/Reshape_1_output_0", "/blocks.27/self_attn/Mul_2_output_0", "/blocks.27/self_attn/Shape_3_output_0", "Shape3686", "Rank3688", "BinaryOp3690", "Unsqueeze3691", "BinaryOp3693", "Unsqueeze3694", "StridedSlice3697", "Squeeze3698", "BinaryOp3699", "BinaryOp3700", "/blocks.27/self_attn/Gather_3_output_0", "/blocks.27/self_attn/Div_1_output_0", "/blocks.27/self_attn/Unsqueeze_9_output_0", "/blocks.27/self_attn/Slice_3_output_0", "/blocks.27/self_attn/Neg_1_output_0", "/blocks.27/self_attn/Unsqueeze_8_output_0", "/blocks.27/self_attn/Slice_2_output_0", "/blocks.27/self_attn/Concat_4_output_0", "/blocks.27/self_attn/Mul_3_output_0", "/blocks.27/self_attn/Add_1_output_0", "/blocks.27/self_attn/v_proj/FakeLinear_output_0", "/blocks.27/self_attn/Unsqueeze_4_output_0", "/blocks.27/self_attn/Unsqueeze_5_output_0", "/blocks.27/self_attn/Concat_2_output_0", "/blocks.27/self_attn/Reshape_2_output_0", "/blocks.27/self_attn/fused_attn/FusedAttention_output_0", "/blocks.27/self_attn/o_proj/FakeLinear_output_0", "/blocks.27/Add_output_0", "/blocks.27/post_attention_layernorm/Mul_1_output_0", "/blocks.27/mlp/gate_proj/FakeLinear_output_0", "/blocks.27/mlp/act_fn/Mul_output_0", "/blocks.27/mlp/up_proj/FakeLinear_output_0", "/blocks.27/mlp/Mul_output_0", "/blocks.27/mlp/down_proj/FakeLinear_output_0", "/blocks.27/Add_1_output_0", "/blocks.28/Reshape_output_0", "/blocks.28/input_layernorm/Mul_1_output_0", "/blocks.28/self_attn/q_proj/FakeLinear_output_0", "/blocks.28/self_attn/Shape_output_0", "Shape3746", "Rank3748", "BinaryOp3750", "Unsqueeze3751", "BinaryOp3753", "Unsqueeze3754", "StridedSlice3757", "Squeeze3758", "BinaryOp3760", "/blocks.28/self_attn/Gather_output_0", "/blocks.28/self_attn/Unsqueeze_output_0", "Unsqueeze3768", "Unsqueeze3771", "StridedSlice3774", "Squeeze3775", "BinaryOp3776", "BinaryOp3777", "/blocks.28/self_attn/Gather_1_output_0", "/blocks.28/self_attn/Unsqueeze_1_output_0", "/blocks.28/self_attn/Concat_output_0", "/blocks.28/self_attn/Reshape_output_0", "/blocks.28/self_attn/Mul_output_0", "/blocks.28/self_attn/Shape_2_output_0", "Shape3784", "Rank3786", "BinaryOp3788", "Unsqueeze3789", "BinaryOp3791", "Unsqueeze3792", "StridedSlice3795", "Squeeze3796", "BinaryOp3797", "BinaryOp3798", "/blocks.28/self_attn/Gather_2_output_0", "/blocks.28/self_attn/Div_output_0", "/blocks.28/self_attn/Unsqueeze_7_output_0", "/blocks.28/self_attn/Slice_1_output_0", "/blocks.28/self_attn/Neg_output_0", "/blocks.28/self_attn/Unsqueeze_6_output_0", "/blocks.28/self_attn/Slice_output_0", "/blocks.28/self_attn/Concat_3_output_0", "/blocks.28/self_attn/Mul_1_output_0", "/blocks.28/self_attn/Add_output_0", "/blocks.28/self_attn/k_proj/FakeLinear_output_0", "/blocks.28/self_attn/Unsqueeze_2_output_0", "/blocks.28/self_attn/Unsqueeze_3_output_0", "/blocks.28/self_attn/Concat_1_output_0", "/blocks.28/self_attn/Reshape_1_output_0", "/blocks.28/self_attn/Mul_2_output_0", "/blocks.28/self_attn/Shape_3_output_0", "Shape3817", "Rank3819", "BinaryOp3821", "Unsqueeze3822", "BinaryOp3824", "Unsqueeze3825", "StridedSlice3828", "Squeeze3829", "BinaryOp3830", "BinaryOp3831", "/blocks.28/self_attn/Gather_3_output_0", "/blocks.28/self_attn/Div_1_output_0", "/blocks.28/self_attn/Unsqueeze_9_output_0", "/blocks.28/self_attn/Slice_3_output_0", "/blocks.28/self_attn/Neg_1_output_0", "/blocks.28/self_attn/Unsqueeze_8_output_0", "/blocks.28/self_attn/Slice_2_output_0", "/blocks.28/self_attn/Concat_4_output_0", "/blocks.28/self_attn/Mul_3_output_0", "/blocks.28/self_attn/Add_1_output_0", "/blocks.28/self_attn/v_proj/FakeLinear_output_0", "/blocks.28/self_attn/Unsqueeze_4_output_0", "/blocks.28/self_attn/Unsqueeze_5_output_0", "/blocks.28/self_attn/Concat_2_output_0", "/blocks.28/self_attn/Reshape_2_output_0", "/blocks.28/self_attn/fused_attn/FusedAttention_output_0", "/blocks.28/self_attn/o_proj/FakeLinear_output_0", "/blocks.28/Add_output_0", "/blocks.28/post_attention_layernorm/Mul_1_output_0", "/blocks.28/mlp/gate_proj/FakeLinear_output_0", "/blocks.28/mlp/act_fn/Mul_output_0", "/blocks.28/mlp/up_proj/FakeLinear_output_0", "/blocks.28/mlp/Mul_output_0", "/blocks.28/mlp/down_proj/FakeLinear_output_0", "/blocks.28/Add_1_output_0", "/blocks.29/Reshape_output_0", "/blocks.29/input_layernorm/Mul_1_output_0", "/blocks.29/self_attn/q_proj/FakeLinear_output_0", "/blocks.29/self_attn/Shape_output_0", "Shape3877", "Rank3879", "BinaryOp3881", "Unsqueeze3882", "BinaryOp3884", "Unsqueeze3885", "StridedSlice3888", "Squeeze3889", "BinaryOp3891", "/blocks.29/self_attn/Gather_output_0", "/blocks.29/self_attn/Unsqueeze_output_0", "Unsqueeze3899", "Unsqueeze3902", "StridedSlice3905", "Squeeze3906", "BinaryOp3907", "BinaryOp3908", "/blocks.29/self_attn/Gather_1_output_0", "/blocks.29/self_attn/Unsqueeze_1_output_0", "/blocks.29/self_attn/Concat_output_0", "/blocks.29/self_attn/Reshape_output_0", "/blocks.29/self_attn/Mul_output_0", "/blocks.29/self_attn/Shape_2_output_0", "Shape3915", "Rank3917", "BinaryOp3919", "Unsqueeze3920", "BinaryOp3922", "Unsqueeze3923", "StridedSlice3926", "Squeeze3927", "BinaryOp3928", "BinaryOp3929", "/blocks.29/self_attn/Gather_2_output_0", "/blocks.29/self_attn/Div_output_0", "/blocks.29/self_attn/Unsqueeze_7_output_0", "/blocks.29/self_attn/Slice_1_output_0", "/blocks.29/self_attn/Neg_output_0", "/blocks.29/self_attn/Unsqueeze_6_output_0", "/blocks.29/self_attn/Slice_output_0", "/blocks.29/self_attn/Concat_3_output_0", "/blocks.29/self_attn/Mul_1_output_0", "/blocks.29/self_attn/Add_output_0", "/blocks.29/self_attn/k_proj/FakeLinear_output_0", "/blocks.29/self_attn/Unsqueeze_2_output_0", "/blocks.29/self_attn/Unsqueeze_3_output_0", "/blocks.29/self_attn/Concat_1_output_0", "/blocks.29/self_attn/Reshape_1_output_0", "/blocks.29/self_attn/Mul_2_output_0", "/blocks.29/self_attn/Shape_3_output_0", "Shape3948", "Rank3950", "BinaryOp3952", "Unsqueeze3953", "BinaryOp3955", "Unsqueeze3956", "StridedSlice3959", "Squeeze3960", "BinaryOp3961", "BinaryOp3962", "/blocks.29/self_attn/Gather_3_output_0", "/blocks.29/self_attn/Div_1_output_0", "/blocks.29/self_attn/Unsqueeze_9_output_0", "/blocks.29/self_attn/Slice_3_output_0", "/blocks.29/self_attn/Neg_1_output_0", "/blocks.29/self_attn/Unsqueeze_8_output_0", "/blocks.29/self_attn/Slice_2_output_0", "/blocks.29/self_attn/Concat_4_output_0", "/blocks.29/self_attn/Mul_3_output_0", "/blocks.29/self_attn/Add_1_output_0", "/blocks.29/self_attn/v_proj/FakeLinear_output_0", "/blocks.29/self_attn/Unsqueeze_4_output_0", "/blocks.29/self_attn/Unsqueeze_5_output_0", "/blocks.29/self_attn/Concat_2_output_0", "/blocks.29/self_attn/Reshape_2_output_0", "/blocks.29/self_attn/fused_attn/FusedAttention_output_0", "/blocks.29/self_attn/o_proj/FakeLinear_output_0", "/blocks.29/Add_output_0", "/blocks.29/post_attention_layernorm/Mul_1_output_0", "/blocks.29/mlp/gate_proj/FakeLinear_output_0", "/blocks.29/mlp/act_fn/Mul_output_0", "/blocks.29/mlp/up_proj/FakeLinear_output_0", "/blocks.29/mlp/Mul_output_0", "/blocks.29/mlp/down_proj/FakeLinear_output_0", "/blocks.29/Add_1_output_0", "/blocks.30/Reshape_output_0", "/blocks.30/input_layernorm/Mul_1_output_0", "/blocks.30/self_attn/q_proj/FakeLinear_output_0", "/blocks.30/self_attn/Shape_output_0", "Shape4008", "Rank4010", "BinaryOp4012", "Unsqueeze4013", "BinaryOp4015", "Unsqueeze4016", "StridedSlice4019", "Squeeze4020", "BinaryOp4022", "/blocks.30/self_attn/Gather_output_0", "/blocks.30/self_attn/Unsqueeze_output_0", "Unsqueeze4030", "Unsqueeze4033", "StridedSlice4036", "Squeeze4037", "BinaryOp4038", "BinaryOp4039", "/blocks.30/self_attn/Gather_1_output_0", "/blocks.30/self_attn/Unsqueeze_1_output_0", "/blocks.30/self_attn/Concat_output_0", "/blocks.30/self_attn/Reshape_output_0", "/blocks.30/self_attn/Mul_output_0", "/blocks.30/self_attn/Shape_2_output_0", "Shape4046", "Rank4048", "BinaryOp4050", "Unsqueeze4051", "BinaryOp4053", "Unsqueeze4054", "StridedSlice4057", "Squeeze4058", "BinaryOp4059", "BinaryOp4060", "/blocks.30/self_attn/Gather_2_output_0", "/blocks.30/self_attn/Div_output_0", "/blocks.30/self_attn/Unsqueeze_7_output_0", "/blocks.30/self_attn/Slice_1_output_0", "/blocks.30/self_attn/Neg_output_0", "/blocks.30/self_attn/Unsqueeze_6_output_0", "/blocks.30/self_attn/Slice_output_0", "/blocks.30/self_attn/Concat_3_output_0", "/blocks.30/self_attn/Mul_1_output_0", "/blocks.30/self_attn/Add_output_0", "/blocks.30/self_attn/k_proj/FakeLinear_output_0", "/blocks.30/self_attn/Unsqueeze_2_output_0", "/blocks.30/self_attn/Unsqueeze_3_output_0", "/blocks.30/self_attn/Concat_1_output_0", "/blocks.30/self_attn/Reshape_1_output_0", "/blocks.30/self_attn/Mul_2_output_0", "/blocks.30/self_attn/Shape_3_output_0", "Shape4079", "Rank4081", "BinaryOp4083", "Unsqueeze4084", "BinaryOp4086", "Unsqueeze4087", "StridedSlice4090", "Squeeze4091", "BinaryOp4092", "BinaryOp4093", "/blocks.30/self_attn/Gather_3_output_0", "/blocks.30/self_attn/Div_1_output_0", "/blocks.30/self_attn/Unsqueeze_9_output_0", "/blocks.30/self_attn/Slice_3_output_0", "/blocks.30/self_attn/Neg_1_output_0", "/blocks.30/self_attn/Unsqueeze_8_output_0", "/blocks.30/self_attn/Slice_2_output_0", "/blocks.30/self_attn/Concat_4_output_0", "/blocks.30/self_attn/Mul_3_output_0", "/blocks.30/self_attn/Add_1_output_0", "/blocks.30/self_attn/v_proj/FakeLinear_output_0", "/blocks.30/self_attn/Unsqueeze_4_output_0", "/blocks.30/self_attn/Unsqueeze_5_output_0", "/blocks.30/self_attn/Concat_2_output_0", "/blocks.30/self_attn/Reshape_2_output_0", "/blocks.30/self_attn/fused_attn/FusedAttention_output_0", "/blocks.30/self_attn/o_proj/FakeLinear_output_0", "/blocks.30/Add_output_0", "/blocks.30/post_attention_layernorm/Mul_1_output_0", "/blocks.30/mlp/gate_proj/FakeLinear_output_0", "/blocks.30/mlp/act_fn/Mul_output_0", "/blocks.30/mlp/up_proj/FakeLinear_output_0", "/blocks.30/mlp/Mul_output_0", "/blocks.30/mlp/down_proj/FakeLinear_output_0", "/blocks.30/Add_1_output_0", "/blocks.31/Reshape_output_0", "/blocks.31/input_layernorm/Mul_1_output_0", "/blocks.31/self_attn/q_proj/FakeLinear_output_0", "/blocks.31/self_attn/Shape_output_0", "Shape4139", "Rank4141", "BinaryOp4143", "Unsqueeze4144", "BinaryOp4146", "Unsqueeze4147", "StridedSlice4150", "Squeeze4151", "BinaryOp4153", "/blocks.31/self_attn/Gather_output_0", "/blocks.31/self_attn/Unsqueeze_output_0", "Unsqueeze4161", "Unsqueeze4164", "StridedSlice4167", "Squeeze4168", "BinaryOp4169", "BinaryOp4170", "/blocks.31/self_attn/Gather_1_output_0", "/blocks.31/self_attn/Unsqueeze_1_output_0", "/blocks.31/self_attn/Concat_output_0", "/blocks.31/self_attn/Reshape_output_0", "/blocks.31/self_attn/Mul_output_0", "/blocks.31/self_attn/Shape_2_output_0", "Shape4177", "Rank4179", "BinaryOp4181", "Unsqueeze4182", "BinaryOp4184", "Unsqueeze4185", "StridedSlice4188", "Squeeze4189", "BinaryOp4190", "BinaryOp4191", "/blocks.31/self_attn/Gather_2_output_0", "/blocks.31/self_attn/Div_output_0", "/blocks.31/self_attn/Unsqueeze_7_output_0", "/blocks.31/self_attn/Slice_1_output_0", "/blocks.31/self_attn/Neg_output_0", "/blocks.31/self_attn/Unsqueeze_6_output_0", "/blocks.31/self_attn/Slice_output_0", "/blocks.31/self_attn/Concat_3_output_0", "/blocks.31/self_attn/Mul_1_output_0", "/blocks.31/self_attn/Add_output_0", "/blocks.31/self_attn/k_proj/FakeLinear_output_0", "/blocks.31/self_attn/Unsqueeze_2_output_0", "/blocks.31/self_attn/Unsqueeze_3_output_0", "/blocks.31/self_attn/Concat_1_output_0", "/blocks.31/self_attn/Reshape_1_output_0", "/blocks.31/self_attn/Mul_2_output_0", "/blocks.31/self_attn/Shape_3_output_0", "Shape4210", "Rank4212", "BinaryOp4214", "Unsqueeze4215", "BinaryOp4217", "Unsqueeze4218", "StridedSlice4221", "Squeeze4222", "BinaryOp4223", "BinaryOp4224", "/blocks.31/self_attn/Gather_3_output_0", "/blocks.31/self_attn/Div_1_output_0", "/blocks.31/self_attn/Unsqueeze_9_output_0", "/blocks.31/self_attn/Slice_3_output_0", "/blocks.31/self_attn/Neg_1_output_0", "/blocks.31/self_attn/Unsqueeze_8_output_0", "/blocks.31/self_attn/Slice_2_output_0", "/blocks.31/self_attn/Concat_4_output_0", "/blocks.31/self_attn/Mul_3_output_0", "/blocks.31/self_attn/Add_1_output_0", "/blocks.31/self_attn/v_proj/FakeLinear_output_0", "/blocks.31/self_attn/Unsqueeze_4_output_0", "/blocks.31/self_attn/Unsqueeze_5_output_0", "/blocks.31/self_attn/Concat_2_output_0", "/blocks.31/self_attn/Reshape_2_output_0", "/blocks.31/self_attn/fused_attn/FusedAttention_output_0", "/blocks.31/self_attn/o_proj/FakeLinear_output_0", "/blocks.31/Add_output_0", "/blocks.31/post_attention_layernorm/Mul_1_output_0", "/blocks.31/mlp/gate_proj/FakeLinear_output_0", "/blocks.31/mlp/act_fn/Mul_output_0", "/blocks.31/mlp/up_proj/FakeLinear_output_0", "/blocks.31/mlp/Mul_output_0", "/blocks.31/mlp/down_proj/FakeLinear_output_0", "/blocks.31/Add_1_output_0", "/Slice_output_0", "hidden_states", "logits", "/layers.0/self_attn/q_proj/Linear/pre_reshape", "/layers.0/self_attn/q_proj/Linear/pre_convert", "/layers.0/self_attn/q_proj/Linear", "/layers.0/self_attn/q_proj/Linear/post_convert", "/layers.0/self_attn/k_proj/Linear/pre_reshape", "/layers.0/self_attn/k_proj/Linear/pre_convert", "/layers.0/self_attn/k_proj/Linear", "/layers.0/self_attn/k_proj/Linear/post_convert", "/layers.0/self_attn/v_proj/Linear/pre_reshape", "/layers.0/self_attn/v_proj/Linear/pre_convert", "/layers.0/self_attn/v_proj/Linear", "/layers.0/self_attn/v_proj/Linear/post_convert", "/layers.0/self_attn/o_proj/Linear/pre_reshape", "/layers.0/self_attn/o_proj/Linear/pre_convert", "/layers.0/self_attn/o_proj/Linear", "/layers.0/self_attn/o_proj/Linear/post_convert", "/layers.0/mlp/gate_proj/Linear/pre_reshape", "/layers.0/mlp/gate_proj/Linear/pre_convert", "/layers.0/mlp/gate_proj/Linear", "/layers.0/mlp/gate_proj/Linear/post_convert", "/layers.0/mlp/up_proj/Linear/pre_reshape", "/layers.0/mlp/up_proj/Linear/pre_convert", "/layers.0/mlp/up_proj/Linear", "/layers.0/mlp/up_proj/Linear/post_convert", "/layers.0/mlp/down_proj/Linear/pre_reshape", "/layers.0/mlp/down_proj/Linear/pre_convert", "/layers.0/mlp/down_proj/Linear", "/layers.0/mlp/down_proj/Linear/post_convert", "/layers.1/self_attn/q_proj/Linear/pre_reshape", "/layers.1/self_attn/q_proj/Linear/pre_convert", "/layers.1/self_attn/q_proj/Linear", "/layers.1/self_attn/q_proj/Linear/post_convert", "/layers.1/self_attn/k_proj/Linear/pre_reshape", "/layers.1/self_attn/k_proj/Linear/pre_convert", "/layers.1/self_attn/k_proj/Linear", "/layers.1/self_attn/k_proj/Linear/post_convert", "/layers.1/self_attn/v_proj/Linear/pre_reshape", "/layers.1/self_attn/v_proj/Linear/pre_convert", "/layers.1/self_attn/v_proj/Linear", "/layers.1/self_attn/v_proj/Linear/post_convert", "/layers.1/self_attn/o_proj/Linear/pre_reshape", "/layers.1/self_attn/o_proj/Linear/pre_convert", "/layers.1/self_attn/o_proj/Linear", "/layers.1/self_attn/o_proj/Linear/post_convert", "/layers.1/mlp/gate_proj/Linear/pre_reshape", "/layers.1/mlp/gate_proj/Linear/pre_convert", "/layers.1/mlp/gate_proj/Linear", "/layers.1/mlp/gate_proj/Linear/post_convert", "/layers.1/mlp/up_proj/Linear/pre_reshape", "/layers.1/mlp/up_proj/Linear/pre_convert", "/layers.1/mlp/up_proj/Linear", "/layers.1/mlp/up_proj/Linear/post_convert", "/layers.1/mlp/down_proj/Linear/pre_reshape", "/layers.1/mlp/down_proj/Linear/pre_convert", "/layers.1/mlp/down_proj/Linear", "/layers.1/mlp/down_proj/Linear/post_convert", "/layers.2/self_attn/q_proj/Linear/pre_reshape", "/layers.2/self_attn/q_proj/Linear/pre_convert", "/layers.2/self_attn/q_proj/Linear", "/layers.2/self_attn/q_proj/Linear/post_convert", "/layers.2/self_attn/k_proj/Linear/pre_reshape", "/layers.2/self_attn/k_proj/Linear/pre_convert", "/layers.2/self_attn/k_proj/Linear", "/layers.2/self_attn/k_proj/Linear/post_convert", "/layers.2/self_attn/v_proj/Linear/pre_reshape", "/layers.2/self_attn/v_proj/Linear/pre_convert", "/layers.2/self_attn/v_proj/Linear", "/layers.2/self_attn/v_proj/Linear/post_convert", "/layers.2/self_attn/o_proj/Linear/pre_reshape", "/layers.2/self_attn/o_proj/Linear/pre_convert", "/layers.2/self_attn/o_proj/Linear", "/layers.2/self_attn/o_proj/Linear/post_convert", "/layers.2/mlp/gate_proj/Linear/pre_reshape", "/layers.2/mlp/gate_proj/Linear/pre_convert", "/layers.2/mlp/gate_proj/Linear", "/layers.2/mlp/gate_proj/Linear/post_convert", "/layers.2/mlp/up_proj/Linear/pre_reshape", "/layers.2/mlp/up_proj/Linear/pre_convert", "/layers.2/mlp/up_proj/Linear", "/layers.2/mlp/up_proj/Linear/post_convert", "/layers.2/mlp/down_proj/Linear/pre_reshape", "/layers.2/mlp/down_proj/Linear/pre_convert", "/layers.2/mlp/down_proj/Linear", "/layers.2/mlp/down_proj/Linear/post_convert", "/layers.3/self_attn/q_proj/Linear/pre_reshape", "/layers.3/self_attn/q_proj/Linear/pre_convert", "/layers.3/self_attn/q_proj/Linear", "/layers.3/self_attn/q_proj/Linear/post_convert", "/layers.3/self_attn/k_proj/Linear/pre_reshape", "/layers.3/self_attn/k_proj/Linear/pre_convert", "/layers.3/self_attn/k_proj/Linear", "/layers.3/self_attn/k_proj/Linear/post_convert", "/layers.3/self_attn/v_proj/Linear/pre_reshape", "/layers.3/self_attn/v_proj/Linear/pre_convert", "/layers.3/self_attn/v_proj/Linear", "/layers.3/self_attn/v_proj/Linear/post_convert", "/layers.3/self_attn/o_proj/Linear/pre_reshape", "/layers.3/self_attn/o_proj/Linear/pre_convert", "/layers.3/self_attn/o_proj/Linear", "/layers.3/self_attn/o_proj/Linear/post_convert", "/layers.3/mlp/gate_proj/Linear/pre_reshape", "/layers.3/mlp/gate_proj/Linear/pre_convert", "/layers.3/mlp/gate_proj/Linear", "/layers.3/mlp/gate_proj/Linear/post_convert", "/layers.3/mlp/up_proj/Linear/pre_reshape", "/layers.3/mlp/up_proj/Linear/pre_convert", "/layers.3/mlp/up_proj/Linear", "/layers.3/mlp/up_proj/Linear/post_convert", "/layers.3/mlp/down_proj/Linear/pre_reshape", "/layers.3/mlp/down_proj/Linear/pre_convert", "/layers.3/mlp/down_proj/Linear", "/layers.3/mlp/down_proj/Linear/post_convert", "/layers.4/self_attn/q_proj/Linear/pre_reshape", "/layers.4/self_attn/q_proj/Linear/pre_convert", "/layers.4/self_attn/q_proj/Linear", "/layers.4/self_attn/q_proj/Linear/post_convert", "/layers.4/self_attn/k_proj/Linear/pre_reshape", "/layers.4/self_attn/k_proj/Linear/pre_convert", "/layers.4/self_attn/k_proj/Linear", "/layers.4/self_attn/k_proj/Linear/post_convert", "/layers.4/self_attn/v_proj/Linear/pre_reshape", "/layers.4/self_attn/v_proj/Linear/pre_convert", "/layers.4/self_attn/v_proj/Linear", "/layers.4/self_attn/v_proj/Linear/post_convert", "/layers.4/self_attn/o_proj/Linear/pre_reshape", "/layers.4/self_attn/o_proj/Linear/pre_convert", "/layers.4/self_attn/o_proj/Linear", "/layers.4/self_attn/o_proj/Linear/post_convert", "/layers.4/mlp/gate_proj/Linear/pre_reshape", "/layers.4/mlp/gate_proj/Linear/pre_convert", "/layers.4/mlp/gate_proj/Linear", "/layers.4/mlp/gate_proj/Linear/post_convert", "/layers.4/mlp/up_proj/Linear/pre_reshape", "/layers.4/mlp/up_proj/Linear/pre_convert", "/layers.4/mlp/up_proj/Linear", "/layers.4/mlp/up_proj/Linear/post_convert", "/layers.4/mlp/down_proj/Linear/pre_reshape", "/layers.4/mlp/down_proj/Linear/pre_convert", "/layers.4/mlp/down_proj/Linear", "/layers.4/mlp/down_proj/Linear/post_convert", "/layers.5/self_attn/q_proj/Linear/pre_reshape", "/layers.5/self_attn/q_proj/Linear/pre_convert", "/layers.5/self_attn/q_proj/Linear", "/layers.5/self_attn/q_proj/Linear/post_convert", "/layers.5/self_attn/k_proj/Linear/pre_reshape", "/layers.5/self_attn/k_proj/Linear/pre_convert", "/layers.5/self_attn/k_proj/Linear", "/layers.5/self_attn/k_proj/Linear/post_convert", "/layers.5/self_attn/v_proj/Linear/pre_reshape", "/layers.5/self_attn/v_proj/Linear/pre_convert", "/layers.5/self_attn/v_proj/Linear", "/layers.5/self_attn/v_proj/Linear/post_convert", "/layers.5/self_attn/o_proj/Linear/pre_reshape", "/layers.5/self_attn/o_proj/Linear/pre_convert", "/layers.5/self_attn/o_proj/Linear", "/layers.5/self_attn/o_proj/Linear/post_convert", "/layers.5/mlp/gate_proj/Linear/pre_reshape", "/layers.5/mlp/gate_proj/Linear/pre_convert", "/layers.5/mlp/gate_proj/Linear", "/layers.5/mlp/gate_proj/Linear/post_convert", "/layers.5/mlp/up_proj/Linear/pre_reshape", "/layers.5/mlp/up_proj/Linear/pre_convert", "/layers.5/mlp/up_proj/Linear", "/layers.5/mlp/up_proj/Linear/post_convert", "/layers.5/mlp/down_proj/Linear/pre_reshape", "/layers.5/mlp/down_proj/Linear/pre_convert", "/layers.5/mlp/down_proj/Linear", "/layers.5/mlp/down_proj/Linear/post_convert", "/layers.6/self_attn/q_proj/Linear/pre_reshape", "/layers.6/self_attn/q_proj/Linear/pre_convert", "/layers.6/self_attn/q_proj/Linear", "/layers.6/self_attn/q_proj/Linear/post_convert", "/layers.6/self_attn/k_proj/Linear/pre_reshape", "/layers.6/self_attn/k_proj/Linear/pre_convert", "/layers.6/self_attn/k_proj/Linear", "/layers.6/self_attn/k_proj/Linear/post_convert", "/layers.6/self_attn/v_proj/Linear/pre_reshape", "/layers.6/self_attn/v_proj/Linear/pre_convert", "/layers.6/self_attn/v_proj/Linear", "/layers.6/self_attn/v_proj/Linear/post_convert", "/layers.6/self_attn/o_proj/Linear/pre_reshape", "/layers.6/self_attn/o_proj/Linear/pre_convert", "/layers.6/self_attn/o_proj/Linear", "/layers.6/self_attn/o_proj/Linear/post_convert", "/layers.6/mlp/gate_proj/Linear/pre_reshape", "/layers.6/mlp/gate_proj/Linear/pre_convert", "/layers.6/mlp/gate_proj/Linear", "/layers.6/mlp/gate_proj/Linear/post_convert", "/layers.6/mlp/up_proj/Linear/pre_reshape", "/layers.6/mlp/up_proj/Linear/pre_convert", "/layers.6/mlp/up_proj/Linear", "/layers.6/mlp/up_proj/Linear/post_convert", "/layers.6/mlp/down_proj/Linear/pre_reshape", "/layers.6/mlp/down_proj/Linear/pre_convert", "/layers.6/mlp/down_proj/Linear", "/layers.6/mlp/down_proj/Linear/post_convert", "/layers.7/self_attn/q_proj/Linear/pre_reshape", "/layers.7/self_attn/q_proj/Linear/pre_convert", "/layers.7/self_attn/q_proj/Linear", "/layers.7/self_attn/q_proj/Linear/post_convert", "/layers.7/self_attn/k_proj/Linear/pre_reshape", "/layers.7/self_attn/k_proj/Linear/pre_convert", "/layers.7/self_attn/k_proj/Linear", "/layers.7/self_attn/k_proj/Linear/post_convert", "/layers.7/self_attn/v_proj/Linear/pre_reshape", "/layers.7/self_attn/v_proj/Linear/pre_convert", "/layers.7/self_attn/v_proj/Linear", "/layers.7/self_attn/v_proj/Linear/post_convert", "/layers.7/self_attn/o_proj/Linear/pre_reshape", "/layers.7/self_attn/o_proj/Linear/pre_convert", "/layers.7/self_attn/o_proj/Linear", "/layers.7/self_attn/o_proj/Linear/post_convert", "/layers.7/mlp/gate_proj/Linear/pre_reshape", "/layers.7/mlp/gate_proj/Linear/pre_convert", "/layers.7/mlp/gate_proj/Linear", "/layers.7/mlp/gate_proj/Linear/post_convert", "/layers.7/mlp/up_proj/Linear/pre_reshape", "/layers.7/mlp/up_proj/Linear/pre_convert", "/layers.7/mlp/up_proj/Linear", "/layers.7/mlp/up_proj/Linear/post_convert", "/layers.7/mlp/down_proj/Linear/pre_reshape", "/layers.7/mlp/down_proj/Linear/pre_convert", "/layers.7/mlp/down_proj/Linear", "/layers.7/mlp/down_proj/Linear/post_convert", "/layers.8/self_attn/q_proj/Linear/pre_reshape", "/layers.8/self_attn/q_proj/Linear/pre_convert", "/layers.8/self_attn/q_proj/Linear", "/layers.8/self_attn/q_proj/Linear/post_convert", "/layers.8/self_attn/k_proj/Linear/pre_reshape", "/layers.8/self_attn/k_proj/Linear/pre_convert", "/layers.8/self_attn/k_proj/Linear", "/layers.8/self_attn/k_proj/Linear/post_convert", "/layers.8/self_attn/v_proj/Linear/pre_reshape", "/layers.8/self_attn/v_proj/Linear/pre_convert", "/layers.8/self_attn/v_proj/Linear", "/layers.8/self_attn/v_proj/Linear/post_convert", "/layers.8/self_attn/o_proj/Linear/pre_reshape", "/layers.8/self_attn/o_proj/Linear/pre_convert", "/layers.8/self_attn/o_proj/Linear", "/layers.8/self_attn/o_proj/Linear/post_convert", "/layers.8/mlp/gate_proj/Linear/pre_reshape", "/layers.8/mlp/gate_proj/Linear/pre_convert", "/layers.8/mlp/gate_proj/Linear", "/layers.8/mlp/gate_proj/Linear/post_convert", "/layers.8/mlp/up_proj/Linear/pre_reshape", "/layers.8/mlp/up_proj/Linear/pre_convert", "/layers.8/mlp/up_proj/Linear", "/layers.8/mlp/up_proj/Linear/post_convert", "/layers.8/mlp/down_proj/Linear/pre_reshape", "/layers.8/mlp/down_proj/Linear/pre_convert", "/layers.8/mlp/down_proj/Linear", "/layers.8/mlp/down_proj/Linear/post_convert", "/layers.9/self_attn/q_proj/Linear/pre_reshape", "/layers.9/self_attn/q_proj/Linear/pre_convert", "/layers.9/self_attn/q_proj/Linear", "/layers.9/self_attn/q_proj/Linear/post_convert", "/layers.9/self_attn/k_proj/Linear/pre_reshape", "/layers.9/self_attn/k_proj/Linear/pre_convert", "/layers.9/self_attn/k_proj/Linear", "/layers.9/self_attn/k_proj/Linear/post_convert", "/layers.9/self_attn/v_proj/Linear/pre_reshape", "/layers.9/self_attn/v_proj/Linear/pre_convert", "/layers.9/self_attn/v_proj/Linear", "/layers.9/self_attn/v_proj/Linear/post_convert", "/layers.9/self_attn/o_proj/Linear/pre_reshape", "/layers.9/self_attn/o_proj/Linear/pre_convert", "/layers.9/self_attn/o_proj/Linear", "/layers.9/self_attn/o_proj/Linear/post_convert", "/layers.9/mlp/gate_proj/Linear/pre_reshape", "/layers.9/mlp/gate_proj/Linear/pre_convert", "/layers.9/mlp/gate_proj/Linear", "/layers.9/mlp/gate_proj/Linear/post_convert", "/layers.9/mlp/up_proj/Linear/pre_reshape", "/layers.9/mlp/up_proj/Linear/pre_convert", "/layers.9/mlp/up_proj/Linear", "/layers.9/mlp/up_proj/Linear/post_convert", "/layers.9/mlp/down_proj/Linear/pre_reshape", "/layers.9/mlp/down_proj/Linear/pre_convert", "/layers.9/mlp/down_proj/Linear", "/layers.9/mlp/down_proj/Linear/post_convert", "/layers.10/self_attn/q_proj/Linear/pre_reshape", "/layers.10/self_attn/q_proj/Linear/pre_convert", "/layers.10/self_attn/q_proj/Linear", "/layers.10/self_attn/q_proj/Linear/post_convert", "/layers.10/self_attn/k_proj/Linear/pre_reshape", "/layers.10/self_attn/k_proj/Linear/pre_convert", "/layers.10/self_attn/k_proj/Linear", "/layers.10/self_attn/k_proj/Linear/post_convert", "/layers.10/self_attn/v_proj/Linear/pre_reshape", "/layers.10/self_attn/v_proj/Linear/pre_convert", "/layers.10/self_attn/v_proj/Linear", "/layers.10/self_attn/v_proj/Linear/post_convert", "/layers.10/self_attn/o_proj/Linear/pre_reshape", "/layers.10/self_attn/o_proj/Linear/pre_convert", "/layers.10/self_attn/o_proj/Linear", "/layers.10/self_attn/o_proj/Linear/post_convert", "/layers.10/mlp/gate_proj/Linear/pre_reshape", "/layers.10/mlp/gate_proj/Linear/pre_convert", "/layers.10/mlp/gate_proj/Linear", "/layers.10/mlp/gate_proj/Linear/post_convert", "/layers.10/mlp/up_proj/Linear/pre_reshape", "/layers.10/mlp/up_proj/Linear/pre_convert", "/layers.10/mlp/up_proj/Linear", "/layers.10/mlp/up_proj/Linear/post_convert", "/layers.10/mlp/down_proj/Linear/pre_reshape", "/layers.10/mlp/down_proj/Linear/pre_convert", "/layers.10/mlp/down_proj/Linear", "/layers.10/mlp/down_proj/Linear/post_convert", "/layers.11/self_attn/q_proj/Linear/pre_reshape", "/layers.11/self_attn/q_proj/Linear/pre_convert", "/layers.11/self_attn/q_proj/Linear", "/layers.11/self_attn/q_proj/Linear/post_convert", "/layers.11/self_attn/k_proj/Linear/pre_reshape", "/layers.11/self_attn/k_proj/Linear/pre_convert", "/layers.11/self_attn/k_proj/Linear", "/layers.11/self_attn/k_proj/Linear/post_convert", "/layers.11/self_attn/v_proj/Linear/pre_reshape", "/layers.11/self_attn/v_proj/Linear/pre_convert", "/layers.11/self_attn/v_proj/Linear", "/layers.11/self_attn/v_proj/Linear/post_convert", "/layers.11/self_attn/o_proj/Linear/pre_reshape", "/layers.11/self_attn/o_proj/Linear/pre_convert", "/layers.11/self_attn/o_proj/Linear", "/layers.11/self_attn/o_proj/Linear/post_convert", "/layers.11/mlp/gate_proj/Linear/pre_reshape", "/layers.11/mlp/gate_proj/Linear/pre_convert", "/layers.11/mlp/gate_proj/Linear", "/layers.11/mlp/gate_proj/Linear/post_convert", "/layers.11/mlp/up_proj/Linear/pre_reshape", "/layers.11/mlp/up_proj/Linear/pre_convert", "/layers.11/mlp/up_proj/Linear", "/layers.11/mlp/up_proj/Linear/post_convert", "/layers.11/mlp/down_proj/Linear/pre_reshape", "/layers.11/mlp/down_proj/Linear/pre_convert", "/layers.11/mlp/down_proj/Linear", "/layers.11/mlp/down_proj/Linear/post_convert", "/layers.12/self_attn/q_proj/Linear/pre_reshape", "/layers.12/self_attn/q_proj/Linear/pre_convert", "/layers.12/self_attn/q_proj/Linear", "/layers.12/self_attn/q_proj/Linear/post_convert", "/layers.12/self_attn/k_proj/Linear/pre_reshape", "/layers.12/self_attn/k_proj/Linear/pre_convert", "/layers.12/self_attn/k_proj/Linear", "/layers.12/self_attn/k_proj/Linear/post_convert", "/layers.12/self_attn/v_proj/Linear/pre_reshape", "/layers.12/self_attn/v_proj/Linear/pre_convert", "/layers.12/self_attn/v_proj/Linear", "/layers.12/self_attn/v_proj/Linear/post_convert", "/layers.12/self_attn/o_proj/Linear/pre_reshape", "/layers.12/self_attn/o_proj/Linear/pre_convert", "/layers.12/self_attn/o_proj/Linear", "/layers.12/self_attn/o_proj/Linear/post_convert", "/layers.12/mlp/gate_proj/Linear/pre_reshape", "/layers.12/mlp/gate_proj/Linear/pre_convert", "/layers.12/mlp/gate_proj/Linear", "/layers.12/mlp/gate_proj/Linear/post_convert", "/layers.12/mlp/up_proj/Linear/pre_reshape", "/layers.12/mlp/up_proj/Linear/pre_convert", "/layers.12/mlp/up_proj/Linear", "/layers.12/mlp/up_proj/Linear/post_convert", "/layers.12/mlp/down_proj/Linear/pre_reshape", "/layers.12/mlp/down_proj/Linear/pre_convert", "/layers.12/mlp/down_proj/Linear", "/layers.12/mlp/down_proj/Linear/post_convert", "/layers.13/self_attn/q_proj/Linear/pre_reshape", "/layers.13/self_attn/q_proj/Linear/pre_convert", "/layers.13/self_attn/q_proj/Linear", "/layers.13/self_attn/q_proj/Linear/post_convert", "/layers.13/self_attn/k_proj/Linear/pre_reshape", "/layers.13/self_attn/k_proj/Linear/pre_convert", "/layers.13/self_attn/k_proj/Linear", "/layers.13/self_attn/k_proj/Linear/post_convert", "/layers.13/self_attn/v_proj/Linear/pre_reshape", "/layers.13/self_attn/v_proj/Linear/pre_convert", "/layers.13/self_attn/v_proj/Linear", "/layers.13/self_attn/v_proj/Linear/post_convert", "/layers.13/self_attn/o_proj/Linear/pre_reshape", "/layers.13/self_attn/o_proj/Linear/pre_convert", "/layers.13/self_attn/o_proj/Linear", "/layers.13/self_attn/o_proj/Linear/post_convert", "/layers.13/mlp/gate_proj/Linear/pre_reshape", "/layers.13/mlp/gate_proj/Linear/pre_convert", "/layers.13/mlp/gate_proj/Linear", "/layers.13/mlp/gate_proj/Linear/post_convert", "/layers.13/mlp/up_proj/Linear/pre_reshape", "/layers.13/mlp/up_proj/Linear/pre_convert", "/layers.13/mlp/up_proj/Linear", "/layers.13/mlp/up_proj/Linear/post_convert", "/layers.13/mlp/down_proj/Linear/pre_reshape", "/layers.13/mlp/down_proj/Linear/pre_convert", "/layers.13/mlp/down_proj/Linear", "/layers.13/mlp/down_proj/Linear/post_convert", "/layers.14/self_attn/q_proj/Linear/pre_reshape", "/layers.14/self_attn/q_proj/Linear/pre_convert", "/layers.14/self_attn/q_proj/Linear", "/layers.14/self_attn/q_proj/Linear/post_convert", "/layers.14/self_attn/k_proj/Linear/pre_reshape", "/layers.14/self_attn/k_proj/Linear/pre_convert", "/layers.14/self_attn/k_proj/Linear", "/layers.14/self_attn/k_proj/Linear/post_convert", "/layers.14/self_attn/v_proj/Linear/pre_reshape", "/layers.14/self_attn/v_proj/Linear/pre_convert", "/layers.14/self_attn/v_proj/Linear", "/layers.14/self_attn/v_proj/Linear/post_convert", "/layers.14/self_attn/o_proj/Linear/pre_reshape", "/layers.14/self_attn/o_proj/Linear/pre_convert", "/layers.14/self_attn/o_proj/Linear", "/layers.14/self_attn/o_proj/Linear/post_convert", "/layers.14/mlp/gate_proj/Linear/pre_reshape", "/layers.14/mlp/gate_proj/Linear/pre_convert", "/layers.14/mlp/gate_proj/Linear", "/layers.14/mlp/gate_proj/Linear/post_convert", "/layers.14/mlp/up_proj/Linear/pre_reshape", "/layers.14/mlp/up_proj/Linear/pre_convert", "/layers.14/mlp/up_proj/Linear", "/layers.14/mlp/up_proj/Linear/post_convert", "/layers.14/mlp/down_proj/Linear/pre_reshape", "/layers.14/mlp/down_proj/Linear/pre_convert", "/layers.14/mlp/down_proj/Linear", "/layers.14/mlp/down_proj/Linear/post_convert", "/layers.15/self_attn/q_proj/Linear/pre_reshape", "/layers.15/self_attn/q_proj/Linear/pre_convert", "/layers.15/self_attn/q_proj/Linear", "/layers.15/self_attn/q_proj/Linear/post_convert", "/layers.15/self_attn/k_proj/Linear/pre_reshape", "/layers.15/self_attn/k_proj/Linear/pre_convert", "/layers.15/self_attn/k_proj/Linear", "/layers.15/self_attn/k_proj/Linear/post_convert", "/layers.15/self_attn/v_proj/Linear/pre_reshape", "/layers.15/self_attn/v_proj/Linear/pre_convert", "/layers.15/self_attn/v_proj/Linear", "/layers.15/self_attn/v_proj/Linear/post_convert", "/layers.15/self_attn/o_proj/Linear/pre_reshape", "/layers.15/self_attn/o_proj/Linear/pre_convert", "/layers.15/self_attn/o_proj/Linear", "/layers.15/self_attn/o_proj/Linear/post_convert", "/layers.15/mlp/gate_proj/Linear/pre_reshape", "/layers.15/mlp/gate_proj/Linear/pre_convert", "/layers.15/mlp/gate_proj/Linear", "/layers.15/mlp/gate_proj/Linear/post_convert", "/layers.15/mlp/up_proj/Linear/pre_reshape", "/layers.15/mlp/up_proj/Linear/pre_convert", "/layers.15/mlp/up_proj/Linear", "/layers.15/mlp/up_proj/Linear/post_convert", "/layers.15/mlp/down_proj/Linear/pre_reshape", "/layers.15/mlp/down_proj/Linear/pre_convert", "/layers.15/mlp/down_proj/Linear", "/layers.15/mlp/down_proj/Linear/post_convert", "/layers.16/self_attn/q_proj/Linear/pre_reshape", "/layers.16/self_attn/q_proj/Linear/pre_convert", "/layers.16/self_attn/q_proj/Linear", "/layers.16/self_attn/q_proj/Linear/post_convert", "/layers.16/self_attn/k_proj/Linear/pre_reshape", "/layers.16/self_attn/k_proj/Linear/pre_convert", "/layers.16/self_attn/k_proj/Linear", "/layers.16/self_attn/k_proj/Linear/post_convert", "/layers.16/self_attn/v_proj/Linear/pre_reshape", "/layers.16/self_attn/v_proj/Linear/pre_convert", "/layers.16/self_attn/v_proj/Linear", "/layers.16/self_attn/v_proj/Linear/post_convert", "/layers.16/self_attn/o_proj/Linear/pre_reshape", "/layers.16/self_attn/o_proj/Linear/pre_convert", "/layers.16/self_attn/o_proj/Linear", "/layers.16/self_attn/o_proj/Linear/post_convert", "/layers.16/mlp/gate_proj/Linear/pre_reshape", "/layers.16/mlp/gate_proj/Linear/pre_convert", "/layers.16/mlp/gate_proj/Linear", "/layers.16/mlp/gate_proj/Linear/post_convert", "/layers.16/mlp/up_proj/Linear/pre_reshape", "/layers.16/mlp/up_proj/Linear/pre_convert", "/layers.16/mlp/up_proj/Linear", "/layers.16/mlp/up_proj/Linear/post_convert", "/layers.16/mlp/down_proj/Linear/pre_reshape", "/layers.16/mlp/down_proj/Linear/pre_convert", "/layers.16/mlp/down_proj/Linear", "/layers.16/mlp/down_proj/Linear/post_convert", "/layers.17/self_attn/q_proj/Linear/pre_reshape", "/layers.17/self_attn/q_proj/Linear/pre_convert", "/layers.17/self_attn/q_proj/Linear", "/layers.17/self_attn/q_proj/Linear/post_convert", "/layers.17/self_attn/k_proj/Linear/pre_reshape", "/layers.17/self_attn/k_proj/Linear/pre_convert", "/layers.17/self_attn/k_proj/Linear", "/layers.17/self_attn/k_proj/Linear/post_convert", "/layers.17/self_attn/v_proj/Linear/pre_reshape", "/layers.17/self_attn/v_proj/Linear/pre_convert", "/layers.17/self_attn/v_proj/Linear", "/layers.17/self_attn/v_proj/Linear/post_convert", "/layers.17/self_attn/o_proj/Linear/pre_reshape", "/layers.17/self_attn/o_proj/Linear/pre_convert", "/layers.17/self_attn/o_proj/Linear", "/layers.17/self_attn/o_proj/Linear/post_convert", "/layers.17/mlp/gate_proj/Linear/pre_reshape", "/layers.17/mlp/gate_proj/Linear/pre_convert", "/layers.17/mlp/gate_proj/Linear", "/layers.17/mlp/gate_proj/Linear/post_convert", "/layers.17/mlp/up_proj/Linear/pre_reshape", "/layers.17/mlp/up_proj/Linear/pre_convert", "/layers.17/mlp/up_proj/Linear", "/layers.17/mlp/up_proj/Linear/post_convert", "/layers.17/mlp/down_proj/Linear/pre_reshape", "/layers.17/mlp/down_proj/Linear/pre_convert", "/layers.17/mlp/down_proj/Linear", "/layers.17/mlp/down_proj/Linear/post_convert", "/layers.18/self_attn/q_proj/Linear/pre_reshape", "/layers.18/self_attn/q_proj/Linear/pre_convert", "/layers.18/self_attn/q_proj/Linear", "/layers.18/self_attn/q_proj/Linear/post_convert", "/layers.18/self_attn/k_proj/Linear/pre_reshape", "/layers.18/self_attn/k_proj/Linear/pre_convert", "/layers.18/self_attn/k_proj/Linear", "/layers.18/self_attn/k_proj/Linear/post_convert", "/layers.18/self_attn/v_proj/Linear/pre_reshape", "/layers.18/self_attn/v_proj/Linear/pre_convert", "/layers.18/self_attn/v_proj/Linear", "/layers.18/self_attn/v_proj/Linear/post_convert", "/layers.18/self_attn/o_proj/Linear/pre_reshape", "/layers.18/self_attn/o_proj/Linear/pre_convert", "/layers.18/self_attn/o_proj/Linear", "/layers.18/self_attn/o_proj/Linear/post_convert", "/layers.18/mlp/gate_proj/Linear/pre_reshape", "/layers.18/mlp/gate_proj/Linear/pre_convert", "/layers.18/mlp/gate_proj/Linear", "/layers.18/mlp/gate_proj/Linear/post_convert", "/layers.18/mlp/up_proj/Linear/pre_reshape", "/layers.18/mlp/up_proj/Linear/pre_convert", "/layers.18/mlp/up_proj/Linear", "/layers.18/mlp/up_proj/Linear/post_convert", "/layers.18/mlp/down_proj/Linear/pre_reshape", "/layers.18/mlp/down_proj/Linear/pre_convert", "/layers.18/mlp/down_proj/Linear", "/layers.18/mlp/down_proj/Linear/post_convert", "/layers.19/self_attn/q_proj/Linear/pre_reshape", "/layers.19/self_attn/q_proj/Linear/pre_convert", "/layers.19/self_attn/q_proj/Linear", "/layers.19/self_attn/q_proj/Linear/post_convert", "/layers.19/self_attn/k_proj/Linear/pre_reshape", "/layers.19/self_attn/k_proj/Linear/pre_convert", "/layers.19/self_attn/k_proj/Linear", "/layers.19/self_attn/k_proj/Linear/post_convert", "/layers.19/self_attn/v_proj/Linear/pre_reshape", "/layers.19/self_attn/v_proj/Linear/pre_convert", "/layers.19/self_attn/v_proj/Linear", "/layers.19/self_attn/v_proj/Linear/post_convert", "/layers.19/self_attn/o_proj/Linear/pre_reshape", "/layers.19/self_attn/o_proj/Linear/pre_convert", "/layers.19/self_attn/o_proj/Linear", "/layers.19/self_attn/o_proj/Linear/post_convert", "/layers.19/mlp/gate_proj/Linear/pre_reshape", "/layers.19/mlp/gate_proj/Linear/pre_convert", "/layers.19/mlp/gate_proj/Linear", "/layers.19/mlp/gate_proj/Linear/post_convert", "/layers.19/mlp/up_proj/Linear/pre_reshape", "/layers.19/mlp/up_proj/Linear/pre_convert", "/layers.19/mlp/up_proj/Linear", "/layers.19/mlp/up_proj/Linear/post_convert", "/layers.19/mlp/down_proj/Linear/pre_reshape", "/layers.19/mlp/down_proj/Linear/pre_convert", "/layers.19/mlp/down_proj/Linear", "/layers.19/mlp/down_proj/Linear/post_convert", "/layers.20/self_attn/q_proj/Linear/pre_reshape", "/layers.20/self_attn/q_proj/Linear/pre_convert", "/layers.20/self_attn/q_proj/Linear", "/layers.20/self_attn/q_proj/Linear/post_convert", "/layers.20/self_attn/k_proj/Linear/pre_reshape", "/layers.20/self_attn/k_proj/Linear/pre_convert", "/layers.20/self_attn/k_proj/Linear", "/layers.20/self_attn/k_proj/Linear/post_convert", "/layers.20/self_attn/v_proj/Linear/pre_reshape", "/layers.20/self_attn/v_proj/Linear/pre_convert", "/layers.20/self_attn/v_proj/Linear", "/layers.20/self_attn/v_proj/Linear/post_convert", "/layers.20/self_attn/o_proj/Linear/pre_reshape", "/layers.20/self_attn/o_proj/Linear/pre_convert", "/layers.20/self_attn/o_proj/Linear", "/layers.20/self_attn/o_proj/Linear/post_convert", "/layers.20/mlp/gate_proj/Linear/pre_reshape", "/layers.20/mlp/gate_proj/Linear/pre_convert", "/layers.20/mlp/gate_proj/Linear", "/layers.20/mlp/gate_proj/Linear/post_convert", "/layers.20/mlp/up_proj/Linear/pre_reshape", "/layers.20/mlp/up_proj/Linear/pre_convert", "/layers.20/mlp/up_proj/Linear", "/layers.20/mlp/up_proj/Linear/post_convert", "/layers.20/mlp/down_proj/Linear/pre_reshape", "/layers.20/mlp/down_proj/Linear/pre_convert", "/layers.20/mlp/down_proj/Linear", "/layers.20/mlp/down_proj/Linear/post_convert", "/layers.21/self_attn/q_proj/Linear/pre_reshape", "/layers.21/self_attn/q_proj/Linear/pre_convert", "/layers.21/self_attn/q_proj/Linear", "/layers.21/self_attn/q_proj/Linear/post_convert", "/layers.21/self_attn/k_proj/Linear/pre_reshape", "/layers.21/self_attn/k_proj/Linear/pre_convert", "/layers.21/self_attn/k_proj/Linear", "/layers.21/self_attn/k_proj/Linear/post_convert", "/layers.21/self_attn/v_proj/Linear/pre_reshape", "/layers.21/self_attn/v_proj/Linear/pre_convert", "/layers.21/self_attn/v_proj/Linear", "/layers.21/self_attn/v_proj/Linear/post_convert", "/layers.21/self_attn/o_proj/Linear/pre_reshape", "/layers.21/self_attn/o_proj/Linear/pre_convert", "/layers.21/self_attn/o_proj/Linear", "/layers.21/self_attn/o_proj/Linear/post_convert", "/layers.21/mlp/gate_proj/Linear/pre_reshape", "/layers.21/mlp/gate_proj/Linear/pre_convert", "/layers.21/mlp/gate_proj/Linear", "/layers.21/mlp/gate_proj/Linear/post_convert", "/layers.21/mlp/up_proj/Linear/pre_reshape", "/layers.21/mlp/up_proj/Linear/pre_convert", "/layers.21/mlp/up_proj/Linear", "/layers.21/mlp/up_proj/Linear/post_convert", "/layers.21/mlp/down_proj/Linear/pre_reshape", "/layers.21/mlp/down_proj/Linear/pre_convert", "/layers.21/mlp/down_proj/Linear", "/layers.21/mlp/down_proj/Linear/post_convert", "/layers.22/self_attn/q_proj/Linear/pre_reshape", "/layers.22/self_attn/q_proj/Linear/pre_convert", "/layers.22/self_attn/q_proj/Linear", "/layers.22/self_attn/q_proj/Linear/post_convert", "/layers.22/self_attn/k_proj/Linear/pre_reshape", "/layers.22/self_attn/k_proj/Linear/pre_convert", "/layers.22/self_attn/k_proj/Linear", "/layers.22/self_attn/k_proj/Linear/post_convert", "/layers.22/self_attn/v_proj/Linear/pre_reshape", "/layers.22/self_attn/v_proj/Linear/pre_convert", "/layers.22/self_attn/v_proj/Linear", "/layers.22/self_attn/v_proj/Linear/post_convert", "/layers.22/self_attn/o_proj/Linear/pre_reshape", "/layers.22/self_attn/o_proj/Linear/pre_convert", "/layers.22/self_attn/o_proj/Linear", "/layers.22/self_attn/o_proj/Linear/post_convert", "/layers.22/mlp/gate_proj/Linear/pre_reshape", "/layers.22/mlp/gate_proj/Linear/pre_convert", "/layers.22/mlp/gate_proj/Linear", "/layers.22/mlp/gate_proj/Linear/post_convert", "/layers.22/mlp/up_proj/Linear/pre_reshape", "/layers.22/mlp/up_proj/Linear/pre_convert", "/layers.22/mlp/up_proj/Linear", "/layers.22/mlp/up_proj/Linear/post_convert", "/layers.22/mlp/down_proj/Linear/pre_reshape", "/layers.22/mlp/down_proj/Linear/pre_convert", "/layers.22/mlp/down_proj/Linear", "/layers.22/mlp/down_proj/Linear/post_convert", "/layers.23/self_attn/q_proj/Linear/pre_reshape", "/layers.23/self_attn/q_proj/Linear/pre_convert", "/layers.23/self_attn/q_proj/Linear", "/layers.23/self_attn/q_proj/Linear/post_convert", "/layers.23/self_attn/k_proj/Linear/pre_reshape", "/layers.23/self_attn/k_proj/Linear/pre_convert", "/layers.23/self_attn/k_proj/Linear", "/layers.23/self_attn/k_proj/Linear/post_convert", "/layers.23/self_attn/v_proj/Linear/pre_reshape", "/layers.23/self_attn/v_proj/Linear/pre_convert", "/layers.23/self_attn/v_proj/Linear", "/layers.23/self_attn/v_proj/Linear/post_convert", "/layers.23/self_attn/o_proj/Linear/pre_reshape", "/layers.23/self_attn/o_proj/Linear/pre_convert", "/layers.23/self_attn/o_proj/Linear", "/layers.23/self_attn/o_proj/Linear/post_convert", "/layers.23/mlp/gate_proj/Linear/pre_reshape", "/layers.23/mlp/gate_proj/Linear/pre_convert", "/layers.23/mlp/gate_proj/Linear", "/layers.23/mlp/gate_proj/Linear/post_convert", "/layers.23/mlp/up_proj/Linear/pre_reshape", "/layers.23/mlp/up_proj/Linear/pre_convert", "/layers.23/mlp/up_proj/Linear", "/layers.23/mlp/up_proj/Linear/post_convert", "/layers.23/mlp/down_proj/Linear/pre_reshape", "/layers.23/mlp/down_proj/Linear/pre_convert", "/layers.23/mlp/down_proj/Linear", "/layers.23/mlp/down_proj/Linear/post_convert", "/layers.24/self_attn/q_proj/Linear/pre_reshape", "/layers.24/self_attn/q_proj/Linear/pre_convert", "/layers.24/self_attn/q_proj/Linear", "/layers.24/self_attn/q_proj/Linear/post_convert", "/layers.24/self_attn/k_proj/Linear/pre_reshape", "/layers.24/self_attn/k_proj/Linear/pre_convert", "/layers.24/self_attn/k_proj/Linear", "/layers.24/self_attn/k_proj/Linear/post_convert", "/layers.24/self_attn/v_proj/Linear/pre_reshape", "/layers.24/self_attn/v_proj/Linear/pre_convert", "/layers.24/self_attn/v_proj/Linear", "/layers.24/self_attn/v_proj/Linear/post_convert", "/layers.24/self_attn/o_proj/Linear/pre_reshape", "/layers.24/self_attn/o_proj/Linear/pre_convert", "/layers.24/self_attn/o_proj/Linear", "/layers.24/self_attn/o_proj/Linear/post_convert", "/layers.24/mlp/gate_proj/Linear/pre_reshape", "/layers.24/mlp/gate_proj/Linear/pre_convert", "/layers.24/mlp/gate_proj/Linear", "/layers.24/mlp/gate_proj/Linear/post_convert", "/layers.24/mlp/up_proj/Linear/pre_reshape", "/layers.24/mlp/up_proj/Linear/pre_convert", "/layers.24/mlp/up_proj/Linear", "/layers.24/mlp/up_proj/Linear/post_convert", "/layers.24/mlp/down_proj/Linear/pre_reshape", "/layers.24/mlp/down_proj/Linear/pre_convert", "/layers.24/mlp/down_proj/Linear", "/layers.24/mlp/down_proj/Linear/post_convert", "/layers.25/self_attn/q_proj/Linear/pre_reshape", "/layers.25/self_attn/q_proj/Linear/pre_convert", "/layers.25/self_attn/q_proj/Linear", "/layers.25/self_attn/q_proj/Linear/post_convert", "/layers.25/self_attn/k_proj/Linear/pre_reshape", "/layers.25/self_attn/k_proj/Linear/pre_convert", "/layers.25/self_attn/k_proj/Linear", "/layers.25/self_attn/k_proj/Linear/post_convert", "/layers.25/self_attn/v_proj/Linear/pre_reshape", "/layers.25/self_attn/v_proj/Linear/pre_convert", "/layers.25/self_attn/v_proj/Linear", "/layers.25/self_attn/v_proj/Linear/post_convert", "/layers.25/self_attn/o_proj/Linear/pre_reshape", "/layers.25/self_attn/o_proj/Linear/pre_convert", "/layers.25/self_attn/o_proj/Linear", "/layers.25/self_attn/o_proj/Linear/post_convert", "/layers.25/mlp/gate_proj/Linear/pre_reshape", "/layers.25/mlp/gate_proj/Linear/pre_convert", "/layers.25/mlp/gate_proj/Linear", "/layers.25/mlp/gate_proj/Linear/post_convert", "/layers.25/mlp/up_proj/Linear/pre_reshape", "/layers.25/mlp/up_proj/Linear/pre_convert", "/layers.25/mlp/up_proj/Linear", "/layers.25/mlp/up_proj/Linear/post_convert", "/layers.25/mlp/down_proj/Linear/pre_reshape", "/layers.25/mlp/down_proj/Linear/pre_convert", "/layers.25/mlp/down_proj/Linear", "/layers.25/mlp/down_proj/Linear/post_convert", "/layers.26/self_attn/q_proj/Linear/pre_reshape", "/layers.26/self_attn/q_proj/Linear/pre_convert", "/layers.26/self_attn/q_proj/Linear", "/layers.26/self_attn/q_proj/Linear/post_convert", "/layers.26/self_attn/k_proj/Linear/pre_reshape", "/layers.26/self_attn/k_proj/Linear/pre_convert", "/layers.26/self_attn/k_proj/Linear", "/layers.26/self_attn/k_proj/Linear/post_convert", "/layers.26/self_attn/v_proj/Linear/pre_reshape", "/layers.26/self_attn/v_proj/Linear/pre_convert", "/layers.26/self_attn/v_proj/Linear", "/layers.26/self_attn/v_proj/Linear/post_convert", "/layers.26/self_attn/o_proj/Linear/pre_reshape", "/layers.26/self_attn/o_proj/Linear/pre_convert", "/layers.26/self_attn/o_proj/Linear", "/layers.26/self_attn/o_proj/Linear/post_convert", "/layers.26/mlp/gate_proj/Linear/pre_reshape", "/layers.26/mlp/gate_proj/Linear/pre_convert", "/layers.26/mlp/gate_proj/Linear", "/layers.26/mlp/gate_proj/Linear/post_convert", "/layers.26/mlp/up_proj/Linear/pre_reshape", "/layers.26/mlp/up_proj/Linear/pre_convert", "/layers.26/mlp/up_proj/Linear", "/layers.26/mlp/up_proj/Linear/post_convert", "/layers.26/mlp/down_proj/Linear/pre_reshape", "/layers.26/mlp/down_proj/Linear/pre_convert", "/layers.26/mlp/down_proj/Linear", "/layers.26/mlp/down_proj/Linear/post_convert", "/layers.27/self_attn/q_proj/Linear/pre_reshape", "/layers.27/self_attn/q_proj/Linear/pre_convert", "/layers.27/self_attn/q_proj/Linear", "/layers.27/self_attn/q_proj/Linear/post_convert", "/layers.27/self_attn/k_proj/Linear/pre_reshape", "/layers.27/self_attn/k_proj/Linear/pre_convert", "/layers.27/self_attn/k_proj/Linear", "/layers.27/self_attn/k_proj/Linear/post_convert", "/layers.27/self_attn/v_proj/Linear/pre_reshape", "/layers.27/self_attn/v_proj/Linear/pre_convert", "/layers.27/self_attn/v_proj/Linear", "/layers.27/self_attn/v_proj/Linear/post_convert", "/layers.27/self_attn/o_proj/Linear/pre_reshape", "/layers.27/self_attn/o_proj/Linear/pre_convert", "/layers.27/self_attn/o_proj/Linear", "/layers.27/self_attn/o_proj/Linear/post_convert", "/layers.27/mlp/gate_proj/Linear/pre_reshape", "/layers.27/mlp/gate_proj/Linear/pre_convert", "/layers.27/mlp/gate_proj/Linear", "/layers.27/mlp/gate_proj/Linear/post_convert", "/layers.27/mlp/up_proj/Linear/pre_reshape", "/layers.27/mlp/up_proj/Linear/pre_convert", "/layers.27/mlp/up_proj/Linear", "/layers.27/mlp/up_proj/Linear/post_convert", "/layers.27/mlp/down_proj/Linear/pre_reshape", "/layers.27/mlp/down_proj/Linear/pre_convert", "/layers.27/mlp/down_proj/Linear", "/layers.27/mlp/down_proj/Linear/post_convert", "/layers.28/self_attn/q_proj/Linear/pre_reshape", "/layers.28/self_attn/q_proj/Linear/pre_convert", "/layers.28/self_attn/q_proj/Linear", "/layers.28/self_attn/q_proj/Linear/post_convert", "/layers.28/self_attn/k_proj/Linear/pre_reshape", "/layers.28/self_attn/k_proj/Linear/pre_convert", "/layers.28/self_attn/k_proj/Linear", "/layers.28/self_attn/k_proj/Linear/post_convert", "/layers.28/self_attn/v_proj/Linear/pre_reshape", "/layers.28/self_attn/v_proj/Linear/pre_convert", "/layers.28/self_attn/v_proj/Linear", "/layers.28/self_attn/v_proj/Linear/post_convert", "/layers.28/self_attn/o_proj/Linear/pre_reshape", "/layers.28/self_attn/o_proj/Linear/pre_convert", "/layers.28/self_attn/o_proj/Linear", "/layers.28/self_attn/o_proj/Linear/post_convert", "/layers.28/mlp/gate_proj/Linear/pre_reshape", "/layers.28/mlp/gate_proj/Linear/pre_convert", "/layers.28/mlp/gate_proj/Linear", "/layers.28/mlp/gate_proj/Linear/post_convert", "/layers.28/mlp/up_proj/Linear/pre_reshape", "/layers.28/mlp/up_proj/Linear/pre_convert", "/layers.28/mlp/up_proj/Linear", "/layers.28/mlp/up_proj/Linear/post_convert", "/layers.28/mlp/down_proj/Linear/pre_reshape", "/layers.28/mlp/down_proj/Linear/pre_convert", "/layers.28/mlp/down_proj/Linear", "/layers.28/mlp/down_proj/Linear/post_convert", "/layers.29/self_attn/q_proj/Linear/pre_reshape", "/layers.29/self_attn/q_proj/Linear/pre_convert", "/layers.29/self_attn/q_proj/Linear", "/layers.29/self_attn/q_proj/Linear/post_convert", "/layers.29/self_attn/k_proj/Linear/pre_reshape", "/layers.29/self_attn/k_proj/Linear/pre_convert", "/layers.29/self_attn/k_proj/Linear", "/layers.29/self_attn/k_proj/Linear/post_convert", "/layers.29/self_attn/v_proj/Linear/pre_reshape", "/layers.29/self_attn/v_proj/Linear/pre_convert", "/layers.29/self_attn/v_proj/Linear", "/layers.29/self_attn/v_proj/Linear/post_convert", "/layers.29/self_attn/o_proj/Linear/pre_reshape", "/layers.29/self_attn/o_proj/Linear/pre_convert", "/layers.29/self_attn/o_proj/Linear", "/layers.29/self_attn/o_proj/Linear/post_convert", "/layers.29/mlp/gate_proj/Linear/pre_reshape", "/layers.29/mlp/gate_proj/Linear/pre_convert", "/layers.29/mlp/gate_proj/Linear", "/layers.29/mlp/gate_proj/Linear/post_convert", "/layers.29/mlp/up_proj/Linear/pre_reshape", "/layers.29/mlp/up_proj/Linear/pre_convert", "/layers.29/mlp/up_proj/Linear", "/layers.29/mlp/up_proj/Linear/post_convert", "/layers.29/mlp/down_proj/Linear/pre_reshape", "/layers.29/mlp/down_proj/Linear/pre_convert", "/layers.29/mlp/down_proj/Linear", "/layers.29/mlp/down_proj/Linear/post_convert", "/layers.30/self_attn/q_proj/Linear/pre_reshape", "/layers.30/self_attn/q_proj/Linear/pre_convert", "/layers.30/self_attn/q_proj/Linear", "/layers.30/self_attn/q_proj/Linear/post_convert", "/layers.30/self_attn/k_proj/Linear/pre_reshape", "/layers.30/self_attn/k_proj/Linear/pre_convert", "/layers.30/self_attn/k_proj/Linear", "/layers.30/self_attn/k_proj/Linear/post_convert", "/layers.30/self_attn/v_proj/Linear/pre_reshape", "/layers.30/self_attn/v_proj/Linear/pre_convert", "/layers.30/self_attn/v_proj/Linear", "/layers.30/self_attn/v_proj/Linear/post_convert", "/layers.30/self_attn/o_proj/Linear/pre_reshape", "/layers.30/self_attn/o_proj/Linear/pre_convert", "/layers.30/self_attn/o_proj/Linear", "/layers.30/self_attn/o_proj/Linear/post_convert", "/layers.30/mlp/gate_proj/Linear/pre_reshape", "/layers.30/mlp/gate_proj/Linear/pre_convert", "/layers.30/mlp/gate_proj/Linear", "/layers.30/mlp/gate_proj/Linear/post_convert", "/layers.30/mlp/up_proj/Linear/pre_reshape", "/layers.30/mlp/up_proj/Linear/pre_convert", "/layers.30/mlp/up_proj/Linear", "/layers.30/mlp/up_proj/Linear/post_convert", "/layers.30/mlp/down_proj/Linear/pre_reshape", "/layers.30/mlp/down_proj/Linear/pre_convert", "/layers.30/mlp/down_proj/Linear", "/layers.30/mlp/down_proj/Linear/post_convert", "/layers.31/self_attn/q_proj/Linear/pre_reshape", "/layers.31/self_attn/q_proj/Linear/pre_convert", "/layers.31/self_attn/q_proj/Linear", "/layers.31/self_attn/q_proj/Linear/post_convert", "/layers.31/self_attn/k_proj/Linear/pre_reshape", "/layers.31/self_attn/k_proj/Linear/pre_convert", "/layers.31/self_attn/k_proj/Linear", "/layers.31/self_attn/k_proj/Linear/post_convert", "/layers.31/self_attn/v_proj/Linear/pre_reshape", "/layers.31/self_attn/v_proj/Linear/pre_convert", "/layers.31/self_attn/v_proj/Linear", "/layers.31/self_attn/v_proj/Linear/post_convert", "/layers.31/self_attn/o_proj/Linear/pre_reshape", "/layers.31/self_attn/o_proj/Linear/pre_convert", "/layers.31/self_attn/o_proj/Linear", "/layers.31/self_attn/o_proj/Linear/post_convert", "/layers.31/mlp/gate_proj/Linear/pre_reshape", "/layers.31/mlp/gate_proj/Linear/pre_convert", "/layers.31/mlp/gate_proj/Linear", "/layers.31/mlp/gate_proj/Linear/post_convert", "/layers.31/mlp/up_proj/Linear/pre_reshape", "/layers.31/mlp/up_proj/Linear/pre_convert", "/layers.31/mlp/up_proj/Linear", "/layers.31/mlp/up_proj/Linear/post_convert", "/layers.31/mlp/down_proj/Linear/pre_reshape", "/layers.31/mlp/down_proj/Linear/pre_convert", "/layers.31/mlp/down_proj/Linear", "/layers.31/mlp/down_proj/Linear/post_convert", "/lm/lm_head/Linear/pre_reshape", "/lm/lm_head/Linear/pre_convert", "/lm/lm_head/Linear", "/lm/lm_head/Linear/post_convert" ] , "tensorNumber": 0, "usage": "INFERENCE", "mnn_uuid": "b5d3c965-61d1-4789-976f-2af4a7ee5170" }