{ "bizCode": "MNNTest", "extraInfo": { "version": "3.2.4" } , "oplists": [ { "main_type": "Input", "main": { "dims": [ 1, 1, 2560 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "input_ids", "outputIndexes": [ 4 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, 1, -1, -1 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "attention_mask", "outputIndexes": [ 159 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 3, -1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "position_ids", "outputIndexes": [ 2 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 36, 2, 1, -1, 8, 128 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "past_key_values", "outputIndexes": [ 0 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "logits_index", "outputIndexes": [ 3 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 3, 1, 2560 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "deepstack_embeds", "outputIndexes": [ 170 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 0 ] , "main_type": "Reshape", "main": { "dims": [ -1 ] , "dimType": "NCHW" } , "name": "presents", "outputIndexes": [ 1 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 3 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1, -1, 2560 ] } , "name": "/Constant_output_0", "outputIndexes": [ 5 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_output_0", "outputIndexes": [ 6 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 6 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 0, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm/Mul_1_output_0", "outputIndexes": [ 7 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3456 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3456 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3457 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3457 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 20480, 5242902, 1310720, 0, 0 ] } , "name": "/layers.0/self_attn/q_proj/Linear", "outputIndexes": [ 3458 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3458 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3459 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3459 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 8 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7 ] , "main_type": "NONE", "name": "/Shape_output_0", "outputIndexes": [ 9 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 9 ] , "main_type": "NONE", "name": "Shape52", "outputIndexes": [ 10 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 9 ] , "main_type": "NONE", "name": "Rank54", "outputIndexes": [ 11 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 11, 11 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp56", "outputIndexes": [ 12 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze57", "outputIndexes": [ 13 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Const9", "outputIndexes": [ 14 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp59", "outputIndexes": [ 15 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 15 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze60", "outputIndexes": [ 16 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Unsqueeze62", "outputIndexes": [ 17 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10, 13, 16, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice63", "outputIndexes": [ 18 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 18 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze64", "outputIndexes": [ 19 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 19 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp66", "outputIndexes": [ 20 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 9, 20, 12 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_1_output_0", "outputIndexes": [ 21 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 0 ] } , "name": "/rotary/Constant_8_output_0", "outputIndexes": [ 22 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_output_0", "outputIndexes": [ 23 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze76", "outputIndexes": [ 24 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 15 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze79", "outputIndexes": [ 25 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10, 24, 25, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice82", "outputIndexes": [ 26 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 26 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze83", "outputIndexes": [ 27 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 27 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp84", "outputIndexes": [ 28 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 27 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp85", "outputIndexes": [ 29 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 9, 29, 12 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_2_output_0", "outputIndexes": [ 30 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 30, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1_output_0", "outputIndexes": [ 31 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 32 ] } , "name": "/Constant_4_output_0", "outputIndexes": [ 32 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 128 ] } , "name": "/Constant_5_output_0", "outputIndexes": [ 33 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 23, 31, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_output_0", "outputIndexes": [ 34 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 8, 34 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_1_output_0", "outputIndexes": [ 35 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 6574102, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm/Mul_1_output_0", "outputIndexes": [ 37 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2 ] , "main_type": "CastParam", "main": { "srcT": "DT_VARIANT", "dstT": "DT_FLOAT" } , "name": "/rotary/Cast_output_0", "outputIndexes": [ 38 ] , "type": "Cast", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ -1 ] } , "name": "/rotary/Constant_1_output_0", "outputIndexes": [ 39 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 38, 39 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_output_0", "outputIndexes": [ 40 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40 ] , "main_type": "NONE", "name": "Shape104", "outputIndexes": [ 41 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 40 ] , "main_type": "NONE", "name": "Rank106", "outputIndexes": [ 42 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 42, 42 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp108", "outputIndexes": [ 43 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 43 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze109", "outputIndexes": [ 44 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 43, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp111", "outputIndexes": [ 45 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 45 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze112", "outputIndexes": [ 46 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 41, 44, 46, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice115", "outputIndexes": [ 47 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 47 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze116", "outputIndexes": [ 48 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 48, 48 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp118", "outputIndexes": [ 49 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40, 49, 43 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/rotary/Gather_output_0", "outputIndexes": [ 50 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1, 24 ] , "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": [ 1.0, 0.78583, 0.617529, 0.485273, 0.381342, 0.29967, 0.23549, 0.185055, 0.145422, 0.114277, 0.089802, 0.070569, 0.055455, 0.043578, 0.034245, 0.026911, 0.021147, 0.016618, 0.013059, 0.010262, 0.008064, 0.006337, 0.00498, 0.003913 ] } , "name": "/rotary/Constant_3_output_0", "outputIndexes": [ 51 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 50, 51 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/rotary/Mul_output_0", "outputIndexes": [ 52 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 43 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze127", "outputIndexes": [ 53 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 45 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze130", "outputIndexes": [ 54 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 41, 53, 54, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice133", "outputIndexes": [ 55 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 55 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze134", "outputIndexes": [ 56 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 56 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp135", "outputIndexes": [ 57 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 57, 56 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp136", "outputIndexes": [ 58 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40, 58, 43 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/rotary/Gather_1_output_0", "outputIndexes": [ 59 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1, 20 ] , "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": [ 0.003075, 0.002417, 0.001899, 0.001492, 0.001173, 0.000922, 0.000724, 0.000569, 0.000447, 0.000351, 0.000276, 0.000217, 0.000171, 0.000134, 0.000105, 0.000083, 0.000065, 0.000051, 0.00004, 0.000032 ] } , "name": "/rotary/Constant_5_output_0", "outputIndexes": [ 60 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 59, 60 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/rotary/Mul_1_output_0", "outputIndexes": [ 61 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/rotary/Constant_6_output_0", "outputIndexes": [ 62 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 43 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze146", "outputIndexes": [ 63 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 45 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze149", "outputIndexes": [ 64 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 41, 63, 64, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice152", "outputIndexes": [ 65 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 65 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze153", "outputIndexes": [ 66 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 66 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp154", "outputIndexes": [ 67 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 67, 66 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp155", "outputIndexes": [ 68 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40, 68, 43 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/rotary/Gather_2_output_0", "outputIndexes": [ 69 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1, 20 ] , "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": [ 0.000025, 0.000019, 0.000015, 0.000012, 0.000009, 0.000007, 0.000006, 0.000005, 0.000004, 0.000003, 0.000002, 0.000002, 0.000001, 0.000001, 0.000001, 0.000001, 0.000001, 0.0, 0.0, 0.0 ] } , "name": "/rotary/Constant_7_output_0", "outputIndexes": [ 70 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 69, 70 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/rotary/Mul_2_output_0", "outputIndexes": [ 71 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 52, 61, 71 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/rotary/Concat_output_0", "outputIndexes": [ 72 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 72 ] , "main_type": "UnaryOp", "main": { "opType": "COS", "T": "DT_FLOAT" } , "name": "/rotary/Cos_output_0", "outputIndexes": [ 73 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 73, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_1_output_0", "outputIndexes": [ 74 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 72 ] , "main_type": "UnaryOp", "main": { "opType": "SIN", "T": "DT_FLOAT" } , "name": "/rotary/Sin_output_0", "outputIndexes": [ 75 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 75, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_2_output_0", "outputIndexes": [ 76 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 74, 76 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/rotary/Concat_1_output_0", "outputIndexes": [ 77 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 77, 77 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/rotary/Concat_2_output_0", "outputIndexes": [ 78 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/rotary/Constant_10_output_0", "outputIndexes": [ 79 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 78, 79 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_3_output_0", "outputIndexes": [ 80 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 80, 17 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_4_output_0", "outputIndexes": [ 81 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 81 ] , "main_type": "NONE", "name": "Shape170", "outputIndexes": [ 82 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 81 ] , "main_type": "NONE", "name": "Rank172", "outputIndexes": [ 83 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 83, 83 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp174", "outputIndexes": [ 84 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 84 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze175", "outputIndexes": [ 85 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 84, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp177", "outputIndexes": [ 86 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 86 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze178", "outputIndexes": [ 87 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 82, 85, 87, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice181", "outputIndexes": [ 88 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 88 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze182", "outputIndexes": [ 89 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 89, 89 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp184", "outputIndexes": [ 90 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 81, 90, 84 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_3_output_0", "outputIndexes": [ 91 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 37, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_output_0", "outputIndexes": [ 92 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 37 ] , "main_type": "NONE", "name": "/Shape_2_output_0", "outputIndexes": [ 93 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/Constant_11_output_0", "outputIndexes": [ 94 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 93 ] , "main_type": "NONE", "name": "Shape311", "outputIndexes": [ 95 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 93 ] , "main_type": "NONE", "name": "Rank313", "outputIndexes": [ 96 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 96, 96 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp315", "outputIndexes": [ 97 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 97 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze316", "outputIndexes": [ 98 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 97, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp318", "outputIndexes": [ 99 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 99 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze319", "outputIndexes": [ 100 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 95, 98, 100, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice322", "outputIndexes": [ 101 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 101 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze323", "outputIndexes": [ 102 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 102 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp324", "outputIndexes": [ 103 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 103, 102 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp325", "outputIndexes": [ 104 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 93, 104, 97 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_5_output_0", "outputIndexes": [ 105 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 105, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_output_0", "outputIndexes": [ 106 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 106, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_7_output_0", "outputIndexes": [ 107 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1073741824 ] } , "name": "/Constant_20_output_0", "outputIndexes": [ 108 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/Constant_14_output_0", "outputIndexes": [ 109 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 37, 107, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_1_output_0", "outputIndexes": [ 110 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 110 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_output_0", "outputIndexes": [ 111 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 106, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_6_output_0", "outputIndexes": [ 112 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 37, 22, 112, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_output_0", "outputIndexes": [ 113 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 111, 113 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_3_output_0", "outputIndexes": [ 114 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 84 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze220", "outputIndexes": [ 115 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 86 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze223", "outputIndexes": [ 116 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 82, 115, 116, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice226", "outputIndexes": [ 117 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 117 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze227", "outputIndexes": [ 118 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 118 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp228", "outputIndexes": [ 119 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 119, 118 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp229", "outputIndexes": [ 120 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 81, 120, 84 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_4_output_0", "outputIndexes": [ 121 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 114, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_1_output_0", "outputIndexes": [ 122 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 92, 122 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_output_0", "outputIndexes": [ 123 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3457 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 6575126, 1310742, 327680, 0, 0 ] } , "name": "/layers.0/self_attn/k_proj/Linear", "outputIndexes": [ 3462 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3462 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3463 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3463 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 124 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_2_output_0", "outputIndexes": [ 125 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 30, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_3_output_0", "outputIndexes": [ 126 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 8 ] } , "name": "/Constant_7_output_0", "outputIndexes": [ 127 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 125, 126, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_1_output_0", "outputIndexes": [ 128 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 124, 128 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_2_output_0", "outputIndexes": [ 129 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 129 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 8213548, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm/Mul_1_output_0", "outputIndexes": [ 131 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 131, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_2_output_0", "outputIndexes": [ 132 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 131 ] , "main_type": "NONE", "name": "/Shape_3_output_0", "outputIndexes": [ 133 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 133 ] , "main_type": "NONE", "name": "Shape189", "outputIndexes": [ 134 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 133 ] , "main_type": "NONE", "name": "Rank191", "outputIndexes": [ 135 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 135, 135 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp193", "outputIndexes": [ 136 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 136 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze194", "outputIndexes": [ 137 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 136, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp196", "outputIndexes": [ 138 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 138 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze197", "outputIndexes": [ 139 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 134, 137, 139, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice200", "outputIndexes": [ 140 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 140 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze201", "outputIndexes": [ 141 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 141 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp202", "outputIndexes": [ 142 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 142, 141 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp203", "outputIndexes": [ 143 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 133, 143, 136 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_6_output_0", "outputIndexes": [ 144 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 144, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_1_output_0", "outputIndexes": [ 145 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 145, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_9_output_0", "outputIndexes": [ 146 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 131, 146, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_3_output_0", "outputIndexes": [ 147 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 147 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_1_output_0", "outputIndexes": [ 148 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 145, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_8_output_0", "outputIndexes": [ 149 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 131, 22, 149, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_2_output_0", "outputIndexes": [ 150 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 148, 150 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_4_output_0", "outputIndexes": [ 151 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 151, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_3_output_0", "outputIndexes": [ 152 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 132, 152 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_1_output_0", "outputIndexes": [ 153 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3457 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 8214572, 1310742, 327680, 0, 0 ] } , "name": "/layers.0/self_attn/v_proj/Linear", "outputIndexes": [ 3466 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3466 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3467 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3467 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 154 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_4_output_0", "outputIndexes": [ 155 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 30, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_5_output_0", "outputIndexes": [ 156 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 155, 156, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_2_output_0", "outputIndexes": [ 157 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 154, 157 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_3_output_0", "outputIndexes": [ 158 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 123, 153, 158, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_8_output_0", "outputIndexes": [ 160 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 160 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3468 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3468 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3469 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3469 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 9852994, 5242902, 1310720, 0, 0 ] } , "name": "/layers.0/self_attn/o_proj/Linear", "outputIndexes": [ 3470 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3470 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3471 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3471 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 161 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 6, 161 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_3_output_0", "outputIndexes": [ 162 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 162 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 16406616, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 163 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 163 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3472 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3472 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3473 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3473 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 16427096, 12451862, 3112960, 0, 0 ] } , "name": "/layers.0/mlp/gate_proj/Linear", "outputIndexes": [ 3474 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3474 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3475 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3475 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 164 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 164 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn/Mul_output_0", "outputIndexes": [ 165 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3473 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 31991918, 12451862, 3112960, 0, 0 ] } , "name": "/layers.0/mlp/up_proj/Linear", "outputIndexes": [ 3478 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3478 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3479 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3479 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 166 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 165, 166 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp/Mul_output_0", "outputIndexes": [ 167 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 167 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3480 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3480 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3481 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3481 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 47556740, 12451862, 3112960, 0, 0 ] } , "name": "/layers.0/mlp/down_proj/Linear", "outputIndexes": [ 3482 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3482 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3483 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3483 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 168 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 162, 168 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_4_output_0", "outputIndexes": [ 169 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 170 ] , "main_type": "NONE", "name": "Shape546", "outputIndexes": [ 171 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 170 ] , "main_type": "NONE", "name": "Rank548", "outputIndexes": [ 172 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 172, 172 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp550", "outputIndexes": [ 173 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 173 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze551", "outputIndexes": [ 174 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 173, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp553", "outputIndexes": [ 175 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 175 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze554", "outputIndexes": [ 176 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 171, 174, 176, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice557", "outputIndexes": [ 177 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 177 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze558", "outputIndexes": [ 178 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 178, 178 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp560", "outputIndexes": [ 179 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 170, 179, 173 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_17_output_0", "outputIndexes": [ 180 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 169, 180 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_5_output_0", "outputIndexes": [ 181 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 181, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_9_output_0", "outputIndexes": [ 182 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 182 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 63121562, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_1/Mul_1_output_0", "outputIndexes": [ 183 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 183 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3484 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3484 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3485 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3485 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 63142042, 5242902, 1310720, 0, 0 ] } , "name": "/layers.1/self_attn/q_proj/Linear", "outputIndexes": [ 3486 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3486 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3487 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3487 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 184 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 183 ] , "main_type": "NONE", "name": "/Shape_14_output_0", "outputIndexes": [ 185 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 185 ] , "main_type": "NONE", "name": "Shape573", "outputIndexes": [ 186 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 185 ] , "main_type": "NONE", "name": "Rank575", "outputIndexes": [ 187 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 187, 187 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp577", "outputIndexes": [ 188 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze578", "outputIndexes": [ 189 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp580", "outputIndexes": [ 190 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 190 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze581", "outputIndexes": [ 191 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186, 189, 191, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice584", "outputIndexes": [ 192 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 192 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze585", "outputIndexes": [ 193 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 193, 193 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp587", "outputIndexes": [ 194 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 185, 194, 188 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_19_output_0", "outputIndexes": [ 195 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 195, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_32_output_0", "outputIndexes": [ 196 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze595", "outputIndexes": [ 197 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 190 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze598", "outputIndexes": [ 198 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186, 197, 198, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice601", "outputIndexes": [ 199 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 199 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze602", "outputIndexes": [ 200 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 200 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp603", "outputIndexes": [ 201 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 201, 200 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp604", "outputIndexes": [ 202 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 185, 202, 188 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_20_output_0", "outputIndexes": [ 203 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 203, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_33_output_0", "outputIndexes": [ 204 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 196, 204, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_13_output_0", "outputIndexes": [ 205 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 184, 205 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_10_output_0", "outputIndexes": [ 206 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 206 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 69695664, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_1/Mul_1_output_0", "outputIndexes": [ 208 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 208, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_8_output_0", "outputIndexes": [ 209 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 208 ] , "main_type": "NONE", "name": "/Shape_16_output_0", "outputIndexes": [ 210 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 210 ] , "main_type": "NONE", "name": "Shape722", "outputIndexes": [ 211 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 210 ] , "main_type": "NONE", "name": "Rank724", "outputIndexes": [ 212 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 212, 212 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp726", "outputIndexes": [ 213 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 213 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze727", "outputIndexes": [ 214 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 213, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp729", "outputIndexes": [ 215 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 215 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze730", "outputIndexes": [ 216 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 211, 214, 216, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice733", "outputIndexes": [ 217 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 217 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze734", "outputIndexes": [ 218 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 218 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp735", "outputIndexes": [ 219 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 219, 218 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp736", "outputIndexes": [ 220 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 210, 220, 213 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_21_output_0", "outputIndexes": [ 221 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 221, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_3_output_0", "outputIndexes": [ 222 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 222, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_39_output_0", "outputIndexes": [ 223 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 208, 223, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_5_output_0", "outputIndexes": [ 224 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 224 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_2_output_0", "outputIndexes": [ 225 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 222, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_38_output_0", "outputIndexes": [ 226 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 208, 22, 226, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_4_output_0", "outputIndexes": [ 227 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 225, 227 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_16_output_0", "outputIndexes": [ 228 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 228, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_9_output_0", "outputIndexes": [ 229 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 209, 229 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_6_output_0", "outputIndexes": [ 230 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3485 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 69696688, 1310742, 327680, 0, 0 ] } , "name": "/layers.1/self_attn/k_proj/Linear", "outputIndexes": [ 3490 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3490 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3491 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3491 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 231 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 195, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_34_output_0", "outputIndexes": [ 232 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 203, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_35_output_0", "outputIndexes": [ 233 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 232, 233, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_14_output_0", "outputIndexes": [ 234 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 231, 234 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_11_output_0", "outputIndexes": [ 235 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 235 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 71335110, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_1/Mul_1_output_0", "outputIndexes": [ 237 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_10_output_0", "outputIndexes": [ 238 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237 ] , "main_type": "NONE", "name": "/Shape_17_output_0", "outputIndexes": [ 239 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 239 ] , "main_type": "NONE", "name": "Shape619", "outputIndexes": [ 240 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 239 ] , "main_type": "NONE", "name": "Rank621", "outputIndexes": [ 241 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 241, 241 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp623", "outputIndexes": [ 242 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 242 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze624", "outputIndexes": [ 243 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 242, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp626", "outputIndexes": [ 244 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 244 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze627", "outputIndexes": [ 245 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 240, 243, 245, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice630", "outputIndexes": [ 246 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 246 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze631", "outputIndexes": [ 247 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 247 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp632", "outputIndexes": [ 248 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 248, 247 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp633", "outputIndexes": [ 249 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 239, 249, 242 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_22_output_0", "outputIndexes": [ 250 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 250, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_4_output_0", "outputIndexes": [ 251 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 251, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_41_output_0", "outputIndexes": [ 252 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 252, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_7_output_0", "outputIndexes": [ 253 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_3_output_0", "outputIndexes": [ 254 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 251, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_40_output_0", "outputIndexes": [ 255 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 22, 255, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_6_output_0", "outputIndexes": [ 256 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 254, 256 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_17_output_0", "outputIndexes": [ 257 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 257, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_11_output_0", "outputIndexes": [ 258 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 238, 258 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_7_output_0", "outputIndexes": [ 259 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3485 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 71336134, 1310742, 327680, 0, 0 ] } , "name": "/layers.1/self_attn/v_proj/Linear", "outputIndexes": [ 3494 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3494 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3495 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3495 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 260 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 195, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_36_output_0", "outputIndexes": [ 261 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 203, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_37_output_0", "outputIndexes": [ 262 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 261, 262, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_15_output_0", "outputIndexes": [ 263 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 260, 263 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_12_output_0", "outputIndexes": [ 264 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 230, 259, 264, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_17_output_0", "outputIndexes": [ 265 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 265 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3496 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3496 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3497 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3497 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 72974556, 5242902, 1310720, 0, 0 ] } , "name": "/layers.1/self_attn/o_proj/Linear", "outputIndexes": [ 3498 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3498 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3499 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3499 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 266 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 182, 266 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_9_output_0", "outputIndexes": [ 267 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 267 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 79528178, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_1/Mul_1_output_0", "outputIndexes": [ 268 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 268 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3500 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3500 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3501 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3501 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 79548658, 12451862, 3112960, 0, 0 ] } , "name": "/layers.1/mlp/gate_proj/Linear", "outputIndexes": [ 3502 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3502 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3503 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3503 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 269 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 269 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_1/Mul_output_0", "outputIndexes": [ 270 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3501 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 95113480, 12451862, 3112960, 0, 0 ] } , "name": "/layers.1/mlp/up_proj/Linear", "outputIndexes": [ 3506 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3506 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3507 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3507 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 271 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 270, 271 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_1/Mul_output_0", "outputIndexes": [ 272 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 272 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3508 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3508 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3509 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3509 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 110678302, 12451862, 3112960, 0, 0 ] } , "name": "/layers.1/mlp/down_proj/Linear", "outputIndexes": [ 3510 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3510 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3511 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3511 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 273 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 267, 273 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_10_output_0", "outputIndexes": [ 274 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 173 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze956", "outputIndexes": [ 275 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 175 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze959", "outputIndexes": [ 276 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 171, 275, 276, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice962", "outputIndexes": [ 277 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 277 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze963", "outputIndexes": [ 278 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 278 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp964", "outputIndexes": [ 279 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 279, 278 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp965", "outputIndexes": [ 280 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 170, 280, 173 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_33_output_0", "outputIndexes": [ 281 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 274, 281 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_11_output_0", "outputIndexes": [ 282 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 282, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_18_output_0", "outputIndexes": [ 283 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 283 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 126243124, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_2/Mul_1_output_0", "outputIndexes": [ 284 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 284 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3512 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3512 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3513 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3513 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 126263604, 5242902, 1310720, 0, 0 ] } , "name": "/layers.2/self_attn/q_proj/Linear", "outputIndexes": [ 3514 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3514 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3515 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3515 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 285 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 284 ] , "main_type": "NONE", "name": "/Shape_28_output_0", "outputIndexes": [ 286 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 286 ] , "main_type": "NONE", "name": "Shape978", "outputIndexes": [ 287 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 286 ] , "main_type": "NONE", "name": "Rank980", "outputIndexes": [ 288 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 288, 288 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp982", "outputIndexes": [ 289 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 289 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze983", "outputIndexes": [ 290 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 289, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp985", "outputIndexes": [ 291 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 291 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze986", "outputIndexes": [ 292 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 287, 290, 292, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice989", "outputIndexes": [ 293 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 293 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze990", "outputIndexes": [ 294 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 294, 294 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp992", "outputIndexes": [ 295 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 286, 295, 289 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_35_output_0", "outputIndexes": [ 296 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 296, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_64_output_0", "outputIndexes": [ 297 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 289 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1000", "outputIndexes": [ 298 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 291 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1003", "outputIndexes": [ 299 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 287, 298, 299, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1006", "outputIndexes": [ 300 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 300 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1007", "outputIndexes": [ 301 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 301 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1008", "outputIndexes": [ 302 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 302, 301 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1009", "outputIndexes": [ 303 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 286, 303, 289 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_36_output_0", "outputIndexes": [ 304 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 304, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_65_output_0", "outputIndexes": [ 305 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 297, 305, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_26_output_0", "outputIndexes": [ 306 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 285, 306 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_19_output_0", "outputIndexes": [ 307 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 307 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 132817226, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_2/Mul_1_output_0", "outputIndexes": [ 309 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 309, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_16_output_0", "outputIndexes": [ 310 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 309 ] , "main_type": "NONE", "name": "/Shape_30_output_0", "outputIndexes": [ 311 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 311 ] , "main_type": "NONE", "name": "Shape1127", "outputIndexes": [ 312 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 311 ] , "main_type": "NONE", "name": "Rank1129", "outputIndexes": [ 313 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 313, 313 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1131", "outputIndexes": [ 314 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 314 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1132", "outputIndexes": [ 315 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 314, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1134", "outputIndexes": [ 316 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 316 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1135", "outputIndexes": [ 317 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 312, 315, 317, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1138", "outputIndexes": [ 318 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 318 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1139", "outputIndexes": [ 319 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 319 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1140", "outputIndexes": [ 320 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 320, 319 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1141", "outputIndexes": [ 321 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 311, 321, 314 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_37_output_0", "outputIndexes": [ 322 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 322, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_6_output_0", "outputIndexes": [ 323 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 323, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_71_output_0", "outputIndexes": [ 324 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 309, 324, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_9_output_0", "outputIndexes": [ 325 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 325 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_4_output_0", "outputIndexes": [ 326 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 323, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_70_output_0", "outputIndexes": [ 327 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 309, 22, 327, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_8_output_0", "outputIndexes": [ 328 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326, 328 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_29_output_0", "outputIndexes": [ 329 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 329, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_17_output_0", "outputIndexes": [ 330 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 310, 330 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_12_output_0", "outputIndexes": [ 331 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3513 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 132818250, 1310742, 327680, 0, 0 ] } , "name": "/layers.2/self_attn/k_proj/Linear", "outputIndexes": [ 3518 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3518 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3519 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3519 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 332 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 296, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_66_output_0", "outputIndexes": [ 333 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 304, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_67_output_0", "outputIndexes": [ 334 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 333, 334, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_27_output_0", "outputIndexes": [ 335 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 332, 335 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_20_output_0", "outputIndexes": [ 336 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 336 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 134456672, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_2/Mul_1_output_0", "outputIndexes": [ 338 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 338, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_18_output_0", "outputIndexes": [ 339 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 338 ] , "main_type": "NONE", "name": "/Shape_31_output_0", "outputIndexes": [ 340 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 340 ] , "main_type": "NONE", "name": "Shape1024", "outputIndexes": [ 341 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 340 ] , "main_type": "NONE", "name": "Rank1026", "outputIndexes": [ 342 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 342, 342 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1028", "outputIndexes": [ 343 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 343 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1029", "outputIndexes": [ 344 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 343, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1031", "outputIndexes": [ 345 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 345 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1032", "outputIndexes": [ 346 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 341, 344, 346, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1035", "outputIndexes": [ 347 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 347 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1036", "outputIndexes": [ 348 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 348 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1037", "outputIndexes": [ 349 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 349, 348 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1038", "outputIndexes": [ 350 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 340, 350, 343 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_38_output_0", "outputIndexes": [ 351 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 351, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_7_output_0", "outputIndexes": [ 352 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 352, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_73_output_0", "outputIndexes": [ 353 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 338, 353, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_11_output_0", "outputIndexes": [ 354 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 354 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_5_output_0", "outputIndexes": [ 355 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 352, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_72_output_0", "outputIndexes": [ 356 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 338, 22, 356, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_10_output_0", "outputIndexes": [ 357 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 355, 357 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_30_output_0", "outputIndexes": [ 358 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 358, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_19_output_0", "outputIndexes": [ 359 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 339, 359 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_13_output_0", "outputIndexes": [ 360 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3513 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 134457696, 1310742, 327680, 0, 0 ] } , "name": "/layers.2/self_attn/v_proj/Linear", "outputIndexes": [ 3522 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3522 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3523 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3523 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 361 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 296, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_68_output_0", "outputIndexes": [ 362 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 304, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_69_output_0", "outputIndexes": [ 363 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 362, 363, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_28_output_0", "outputIndexes": [ 364 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 361, 364 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_21_output_0", "outputIndexes": [ 365 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 331, 360, 365, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_26_output_0", "outputIndexes": [ 366 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 366 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3524 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3524 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3525 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3525 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 136096118, 5242902, 1310720, 0, 0 ] } , "name": "/layers.2/self_attn/o_proj/Linear", "outputIndexes": [ 3526 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3526 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3527 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3527 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 367 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 283, 367 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_15_output_0", "outputIndexes": [ 368 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 368 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 142649740, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_2/Mul_1_output_0", "outputIndexes": [ 369 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 369 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3528 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3528 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3529 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3529 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 142670220, 12451862, 3112960, 0, 0 ] } , "name": "/layers.2/mlp/gate_proj/Linear", "outputIndexes": [ 3530 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3530 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3531 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3531 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 370 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 370 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_2/Mul_output_0", "outputIndexes": [ 371 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3529 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 158235042, 12451862, 3112960, 0, 0 ] } , "name": "/layers.2/mlp/up_proj/Linear", "outputIndexes": [ 3534 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3534 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3535 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3535 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 372 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 371, 372 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_2/Mul_output_0", "outputIndexes": [ 373 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 373 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3536 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3536 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3537 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3537 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 173799864, 12451862, 3112960, 0, 0 ] } , "name": "/layers.2/mlp/down_proj/Linear", "outputIndexes": [ 3538 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3538 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3539 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3539 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 374 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 368, 374 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_16_output_0", "outputIndexes": [ 375 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 173 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1361", "outputIndexes": [ 376 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 175 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1364", "outputIndexes": [ 377 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 171, 376, 377, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1367", "outputIndexes": [ 378 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 378 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1368", "outputIndexes": [ 379 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 379 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1369", "outputIndexes": [ 380 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 380, 379 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1370", "outputIndexes": [ 381 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 170, 381, 173 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_49_output_0", "outputIndexes": [ 382 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 375, 382 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_17_output_0", "outputIndexes": [ 383 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 383, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_27_output_0", "outputIndexes": [ 384 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 384 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 189364686, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_3/Mul_1_output_0", "outputIndexes": [ 385 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 385 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3540 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3540 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3541 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3541 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 189385166, 5242902, 1310720, 0, 0 ] } , "name": "/layers.3/self_attn/q_proj/Linear", "outputIndexes": [ 3542 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3542 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3543 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3543 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 386 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 385 ] , "main_type": "NONE", "name": "/Shape_42_output_0", "outputIndexes": [ 387 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 387 ] , "main_type": "NONE", "name": "Shape1383", "outputIndexes": [ 388 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 387 ] , "main_type": "NONE", "name": "Rank1385", "outputIndexes": [ 389 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 389, 389 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1387", "outputIndexes": [ 390 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 390 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1388", "outputIndexes": [ 391 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 390, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1390", "outputIndexes": [ 392 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 392 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1391", "outputIndexes": [ 393 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 388, 391, 393, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1394", "outputIndexes": [ 394 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 394 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1395", "outputIndexes": [ 395 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 395, 395 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1397", "outputIndexes": [ 396 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 387, 396, 390 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_51_output_0", "outputIndexes": [ 397 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 397, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_96_output_0", "outputIndexes": [ 398 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 390 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1405", "outputIndexes": [ 399 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 392 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1408", "outputIndexes": [ 400 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 388, 399, 400, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1411", "outputIndexes": [ 401 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 401 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1412", "outputIndexes": [ 402 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 402 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1413", "outputIndexes": [ 403 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 403, 402 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1414", "outputIndexes": [ 404 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 387, 404, 390 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_52_output_0", "outputIndexes": [ 405 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 405, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_97_output_0", "outputIndexes": [ 406 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 398, 406, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_39_output_0", "outputIndexes": [ 407 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 386, 407 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_28_output_0", "outputIndexes": [ 408 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 408 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 195938788, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_3/Mul_1_output_0", "outputIndexes": [ 410 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_24_output_0", "outputIndexes": [ 411 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410 ] , "main_type": "NONE", "name": "/Shape_44_output_0", "outputIndexes": [ 412 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 412 ] , "main_type": "NONE", "name": "Shape1532", "outputIndexes": [ 413 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 412 ] , "main_type": "NONE", "name": "Rank1534", "outputIndexes": [ 414 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 414, 414 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1536", "outputIndexes": [ 415 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 415 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1537", "outputIndexes": [ 416 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 415, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1539", "outputIndexes": [ 417 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 417 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1540", "outputIndexes": [ 418 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 413, 416, 418, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1543", "outputIndexes": [ 419 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 419 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1544", "outputIndexes": [ 420 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 420 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1545", "outputIndexes": [ 421 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 421, 420 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1546", "outputIndexes": [ 422 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 412, 422, 415 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_53_output_0", "outputIndexes": [ 423 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_9_output_0", "outputIndexes": [ 424 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 424, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_103_output_0", "outputIndexes": [ 425 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410, 425, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_13_output_0", "outputIndexes": [ 426 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_6_output_0", "outputIndexes": [ 427 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 424, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_102_output_0", "outputIndexes": [ 428 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410, 22, 428, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_12_output_0", "outputIndexes": [ 429 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 427, 429 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_42_output_0", "outputIndexes": [ 430 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 430, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_25_output_0", "outputIndexes": [ 431 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 411, 431 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_18_output_0", "outputIndexes": [ 432 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3541 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 195939812, 1310742, 327680, 0, 0 ] } , "name": "/layers.3/self_attn/k_proj/Linear", "outputIndexes": [ 3546 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3546 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3547 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3547 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 433 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 397, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_98_output_0", "outputIndexes": [ 434 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 405, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_99_output_0", "outputIndexes": [ 435 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 434, 435, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_40_output_0", "outputIndexes": [ 436 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 433, 436 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_29_output_0", "outputIndexes": [ 437 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 437 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 197578234, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_3/Mul_1_output_0", "outputIndexes": [ 439 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_26_output_0", "outputIndexes": [ 440 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439 ] , "main_type": "NONE", "name": "/Shape_45_output_0", "outputIndexes": [ 441 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 441 ] , "main_type": "NONE", "name": "Shape1429", "outputIndexes": [ 442 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 441 ] , "main_type": "NONE", "name": "Rank1431", "outputIndexes": [ 443 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 443, 443 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1433", "outputIndexes": [ 444 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 444 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1434", "outputIndexes": [ 445 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 444, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1436", "outputIndexes": [ 446 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 446 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1437", "outputIndexes": [ 447 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 442, 445, 447, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1440", "outputIndexes": [ 448 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 448 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1441", "outputIndexes": [ 449 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 449 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1442", "outputIndexes": [ 450 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 450, 449 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1443", "outputIndexes": [ 451 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 441, 451, 444 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_54_output_0", "outputIndexes": [ 452 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 452, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_10_output_0", "outputIndexes": [ 453 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_105_output_0", "outputIndexes": [ 454 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439, 454, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_15_output_0", "outputIndexes": [ 455 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 455 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_7_output_0", "outputIndexes": [ 456 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_104_output_0", "outputIndexes": [ 457 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439, 22, 457, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_14_output_0", "outputIndexes": [ 458 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 456, 458 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_43_output_0", "outputIndexes": [ 459 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 459, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_27_output_0", "outputIndexes": [ 460 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 440, 460 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_19_output_0", "outputIndexes": [ 461 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3541 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 197579258, 1310742, 327680, 0, 0 ] } , "name": "/layers.3/self_attn/v_proj/Linear", "outputIndexes": [ 3550 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3550 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3551 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3551 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 462 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 397, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_100_output_0", "outputIndexes": [ 463 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 405, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_101_output_0", "outputIndexes": [ 464 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 463, 464, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_41_output_0", "outputIndexes": [ 465 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 462, 465 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_30_output_0", "outputIndexes": [ 466 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 432, 461, 466, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_35_output_0", "outputIndexes": [ 467 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 467 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3552 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3552 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3553 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3553 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 199217680, 5242902, 1310720, 0, 0 ] } , "name": "/layers.3/self_attn/o_proj/Linear", "outputIndexes": [ 3554 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3554 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3555 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3555 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 468 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 384, 468 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_21_output_0", "outputIndexes": [ 469 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 469 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 205771302, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_3/Mul_1_output_0", "outputIndexes": [ 470 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 470 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3556 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3556 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3557 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3557 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 205791782, 12451862, 3112960, 0, 0 ] } , "name": "/layers.3/mlp/gate_proj/Linear", "outputIndexes": [ 3558 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3558 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3559 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3559 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 471 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 471 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_3/Mul_output_0", "outputIndexes": [ 472 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3557 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 221356604, 12451862, 3112960, 0, 0 ] } , "name": "/layers.3/mlp/up_proj/Linear", "outputIndexes": [ 3562 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3562 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3563 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3563 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 473 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 472, 473 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_3/Mul_output_0", "outputIndexes": [ 474 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 474 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3564 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3564 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3565 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3565 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 236921426, 12451862, 3112960, 0, 0 ] } , "name": "/layers.3/mlp/down_proj/Linear", "outputIndexes": [ 3566 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3566 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3567 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3567 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 475 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 469, 475 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_22_output_0", "outputIndexes": [ 476 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 476, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_36_output_0", "outputIndexes": [ 477 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 477 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 252486248, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_4/Mul_1_output_0", "outputIndexes": [ 478 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 478 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3568 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3568 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3569 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3569 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 252506728, 5242902, 1310720, 0, 0 ] } , "name": "/layers.4/self_attn/q_proj/Linear", "outputIndexes": [ 3570 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3570 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3571 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3571 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 479 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 478 ] , "main_type": "NONE", "name": "/Shape_56_output_0", "outputIndexes": [ 480 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 480 ] , "main_type": "NONE", "name": "Shape1771", "outputIndexes": [ 481 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 480 ] , "main_type": "NONE", "name": "Rank1773", "outputIndexes": [ 482 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 482, 482 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1775", "outputIndexes": [ 483 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 483 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1776", "outputIndexes": [ 484 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 483, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1778", "outputIndexes": [ 485 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 485 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1779", "outputIndexes": [ 486 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 481, 484, 486, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1782", "outputIndexes": [ 487 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 487 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1783", "outputIndexes": [ 488 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 488, 488 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1785", "outputIndexes": [ 489 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 480, 489, 483 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_66_output_0", "outputIndexes": [ 490 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 490, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_128_output_0", "outputIndexes": [ 491 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 483 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1793", "outputIndexes": [ 492 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 485 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1796", "outputIndexes": [ 493 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 481, 492, 493, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1799", "outputIndexes": [ 494 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 494 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1800", "outputIndexes": [ 495 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 495 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1801", "outputIndexes": [ 496 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 496, 495 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1802", "outputIndexes": [ 497 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 480, 497, 483 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_67_output_0", "outputIndexes": [ 498 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 498, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_129_output_0", "outputIndexes": [ 499 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 491, 499, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_52_output_0", "outputIndexes": [ 500 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 479, 500 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_37_output_0", "outputIndexes": [ 501 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 501 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 259060350, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_4/Mul_1_output_0", "outputIndexes": [ 503 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 503, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_32_output_0", "outputIndexes": [ 504 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 503 ] , "main_type": "NONE", "name": "/Shape_58_output_0", "outputIndexes": [ 505 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 505 ] , "main_type": "NONE", "name": "Shape1921", "outputIndexes": [ 506 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 505 ] , "main_type": "NONE", "name": "Rank1923", "outputIndexes": [ 507 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 507, 507 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1925", "outputIndexes": [ 508 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 508 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1926", "outputIndexes": [ 509 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 508, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1928", "outputIndexes": [ 510 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 510 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1929", "outputIndexes": [ 511 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 506, 509, 511, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1932", "outputIndexes": [ 512 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 512 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1933", "outputIndexes": [ 513 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 513 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1934", "outputIndexes": [ 514 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 514, 513 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1935", "outputIndexes": [ 515 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 505, 515, 508 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_68_output_0", "outputIndexes": [ 516 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 516, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_12_output_0", "outputIndexes": [ 517 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_135_output_0", "outputIndexes": [ 518 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 503, 518, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_17_output_0", "outputIndexes": [ 519 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 519 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_8_output_0", "outputIndexes": [ 520 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_134_output_0", "outputIndexes": [ 521 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 503, 22, 521, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_16_output_0", "outputIndexes": [ 522 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 520, 522 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_55_output_0", "outputIndexes": [ 523 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 523, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_33_output_0", "outputIndexes": [ 524 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 504, 524 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_23_output_0", "outputIndexes": [ 525 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3569 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 259061374, 1310742, 327680, 0, 0 ] } , "name": "/layers.4/self_attn/k_proj/Linear", "outputIndexes": [ 3574 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3574 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3575 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3575 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 526 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 490, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_130_output_0", "outputIndexes": [ 527 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 498, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_131_output_0", "outputIndexes": [ 528 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 527, 528, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_53_output_0", "outputIndexes": [ 529 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 526, 529 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_38_output_0", "outputIndexes": [ 530 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 530 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 260699796, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_4/Mul_1_output_0", "outputIndexes": [ 532 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 532, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_34_output_0", "outputIndexes": [ 533 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 532 ] , "main_type": "NONE", "name": "/Shape_59_output_0", "outputIndexes": [ 534 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 534 ] , "main_type": "NONE", "name": "Shape1817", "outputIndexes": [ 535 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 534 ] , "main_type": "NONE", "name": "Rank1819", "outputIndexes": [ 536 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 536, 536 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1821", "outputIndexes": [ 537 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 537 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1822", "outputIndexes": [ 538 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 537, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1824", "outputIndexes": [ 539 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 539 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1825", "outputIndexes": [ 540 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 535, 538, 540, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1828", "outputIndexes": [ 541 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 541 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1829", "outputIndexes": [ 542 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 542 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1830", "outputIndexes": [ 543 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 543, 542 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1831", "outputIndexes": [ 544 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 534, 544, 537 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_69_output_0", "outputIndexes": [ 545 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 545, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_13_output_0", "outputIndexes": [ 546 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 546, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_137_output_0", "outputIndexes": [ 547 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 532, 547, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_19_output_0", "outputIndexes": [ 548 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 548 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_9_output_0", "outputIndexes": [ 549 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 546, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_136_output_0", "outputIndexes": [ 550 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 532, 22, 550, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_18_output_0", "outputIndexes": [ 551 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 549, 551 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_56_output_0", "outputIndexes": [ 552 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 552, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_35_output_0", "outputIndexes": [ 553 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 533, 553 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_24_output_0", "outputIndexes": [ 554 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3569 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 260700820, 1310742, 327680, 0, 0 ] } , "name": "/layers.4/self_attn/v_proj/Linear", "outputIndexes": [ 3578 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3578 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3579 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3579 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 555 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 490, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_132_output_0", "outputIndexes": [ 556 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 498, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_133_output_0", "outputIndexes": [ 557 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 556, 557, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_54_output_0", "outputIndexes": [ 558 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 555, 558 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_39_output_0", "outputIndexes": [ 559 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 525, 554, 559, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_44_output_0", "outputIndexes": [ 560 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 560 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3580 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3580 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3581 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3581 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 262339242, 5242902, 1310720, 0, 0 ] } , "name": "/layers.4/self_attn/o_proj/Linear", "outputIndexes": [ 3582 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3582 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3583 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3583 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 561 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 477, 561 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_26_output_0", "outputIndexes": [ 562 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 562 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 268892864, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_4/Mul_1_output_0", "outputIndexes": [ 563 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 563 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3584 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3584 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3585 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3585 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 268913344, 12451862, 3112960, 0, 0 ] } , "name": "/layers.4/mlp/gate_proj/Linear", "outputIndexes": [ 3586 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3586 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3587 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3587 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 564 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 564 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_4/Mul_output_0", "outputIndexes": [ 565 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3585 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 284478166, 12451862, 3112960, 0, 0 ] } , "name": "/layers.4/mlp/up_proj/Linear", "outputIndexes": [ 3590 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3590 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3591 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3591 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 566 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 565, 566 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_4/Mul_output_0", "outputIndexes": [ 567 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 567 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3592 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3592 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3593 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3593 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 300042988, 12451862, 3112960, 0, 0 ] } , "name": "/layers.4/mlp/down_proj/Linear", "outputIndexes": [ 3594 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3594 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3595 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3595 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 568 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 562, 568 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_27_output_0", "outputIndexes": [ 569 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 569, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_45_output_0", "outputIndexes": [ 570 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 570 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 315607810, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_5/Mul_1_output_0", "outputIndexes": [ 571 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 571 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3596 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3596 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3597 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3597 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 315628290, 5242902, 1310720, 0, 0 ] } , "name": "/layers.5/self_attn/q_proj/Linear", "outputIndexes": [ 3598 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3598 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3599 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3599 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 572 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 571 ] , "main_type": "NONE", "name": "/Shape_70_output_0", "outputIndexes": [ 573 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 573 ] , "main_type": "NONE", "name": "Shape2160", "outputIndexes": [ 574 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 573 ] , "main_type": "NONE", "name": "Rank2162", "outputIndexes": [ 575 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 575, 575 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2164", "outputIndexes": [ 576 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 576 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2165", "outputIndexes": [ 577 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 576, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2167", "outputIndexes": [ 578 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 578 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2168", "outputIndexes": [ 579 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 574, 577, 579, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2171", "outputIndexes": [ 580 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 580 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2172", "outputIndexes": [ 581 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 581, 581 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2174", "outputIndexes": [ 582 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 573, 582, 576 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_81_output_0", "outputIndexes": [ 583 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 583, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_160_output_0", "outputIndexes": [ 584 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 576 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2182", "outputIndexes": [ 585 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 578 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2185", "outputIndexes": [ 586 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 574, 585, 586, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2188", "outputIndexes": [ 587 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 587 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2189", "outputIndexes": [ 588 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 588 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2190", "outputIndexes": [ 589 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 589, 588 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2191", "outputIndexes": [ 590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 573, 590, 576 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_82_output_0", "outputIndexes": [ 591 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 591, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_161_output_0", "outputIndexes": [ 592 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 584, 592, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_65_output_0", "outputIndexes": [ 593 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 572, 593 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_46_output_0", "outputIndexes": [ 594 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 594 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 322181912, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_5/Mul_1_output_0", "outputIndexes": [ 596 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 596, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_40_output_0", "outputIndexes": [ 597 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 596 ] , "main_type": "NONE", "name": "/Shape_72_output_0", "outputIndexes": [ 598 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 598 ] , "main_type": "NONE", "name": "Shape2310", "outputIndexes": [ 599 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 598 ] , "main_type": "NONE", "name": "Rank2312", "outputIndexes": [ 600 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 600, 600 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2314", "outputIndexes": [ 601 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2315", "outputIndexes": [ 602 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2317", "outputIndexes": [ 603 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 603 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2318", "outputIndexes": [ 604 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 599, 602, 604, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2321", "outputIndexes": [ 605 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 605 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2322", "outputIndexes": [ 606 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 606 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2323", "outputIndexes": [ 607 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 607, 606 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2324", "outputIndexes": [ 608 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 598, 608, 601 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_83_output_0", "outputIndexes": [ 609 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 609, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_15_output_0", "outputIndexes": [ 610 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 610, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_167_output_0", "outputIndexes": [ 611 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 596, 611, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_21_output_0", "outputIndexes": [ 612 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 612 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_10_output_0", "outputIndexes": [ 613 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 610, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_166_output_0", "outputIndexes": [ 614 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 596, 22, 614, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_20_output_0", "outputIndexes": [ 615 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 613, 615 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_68_output_0", "outputIndexes": [ 616 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 616, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_41_output_0", "outputIndexes": [ 617 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 597, 617 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_28_output_0", "outputIndexes": [ 618 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3597 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 322182936, 1310742, 327680, 0, 0 ] } , "name": "/layers.5/self_attn/k_proj/Linear", "outputIndexes": [ 3602 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3602 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3603 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3603 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 619 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 583, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_162_output_0", "outputIndexes": [ 620 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 591, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_163_output_0", "outputIndexes": [ 621 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 620, 621, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_66_output_0", "outputIndexes": [ 622 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 619, 622 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_47_output_0", "outputIndexes": [ 623 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 623 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 323821358, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_5/Mul_1_output_0", "outputIndexes": [ 625 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 625, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_42_output_0", "outputIndexes": [ 626 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 625 ] , "main_type": "NONE", "name": "/Shape_73_output_0", "outputIndexes": [ 627 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 627 ] , "main_type": "NONE", "name": "Shape2206", "outputIndexes": [ 628 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 627 ] , "main_type": "NONE", "name": "Rank2208", "outputIndexes": [ 629 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 629, 629 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2210", "outputIndexes": [ 630 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 630 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2211", "outputIndexes": [ 631 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 630, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2213", "outputIndexes": [ 632 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 632 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2214", "outputIndexes": [ 633 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 628, 631, 633, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2217", "outputIndexes": [ 634 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 634 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2218", "outputIndexes": [ 635 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 635 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2219", "outputIndexes": [ 636 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 636, 635 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2220", "outputIndexes": [ 637 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 627, 637, 630 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_84_output_0", "outputIndexes": [ 638 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 638, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_16_output_0", "outputIndexes": [ 639 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 639, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_169_output_0", "outputIndexes": [ 640 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 625, 640, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_23_output_0", "outputIndexes": [ 641 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 641 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_11_output_0", "outputIndexes": [ 642 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 639, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_168_output_0", "outputIndexes": [ 643 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 625, 22, 643, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_22_output_0", "outputIndexes": [ 644 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 642, 644 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_69_output_0", "outputIndexes": [ 645 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 645, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_43_output_0", "outputIndexes": [ 646 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 626, 646 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_29_output_0", "outputIndexes": [ 647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3597 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 323822382, 1310742, 327680, 0, 0 ] } , "name": "/layers.5/self_attn/v_proj/Linear", "outputIndexes": [ 3606 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3606 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3607 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3607 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 648 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 583, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_164_output_0", "outputIndexes": [ 649 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 591, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_165_output_0", "outputIndexes": [ 650 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 649, 650, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_67_output_0", "outputIndexes": [ 651 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 648, 651 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_48_output_0", "outputIndexes": [ 652 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 618, 647, 652, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_53_output_0", "outputIndexes": [ 653 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 653 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3608 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3608 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3609 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3609 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 325460804, 5242902, 1310720, 0, 0 ] } , "name": "/layers.5/self_attn/o_proj/Linear", "outputIndexes": [ 3610 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3610 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3611 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3611 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 654 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 570, 654 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_31_output_0", "outputIndexes": [ 655 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 655 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 332014426, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_5/Mul_1_output_0", "outputIndexes": [ 656 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 656 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3612 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3612 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3613 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3613 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 332034906, 12451862, 3112960, 0, 0 ] } , "name": "/layers.5/mlp/gate_proj/Linear", "outputIndexes": [ 3614 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3614 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3615 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3615 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 657 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 657 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_5/Mul_output_0", "outputIndexes": [ 658 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3613 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 347599728, 12451862, 3112960, 0, 0 ] } , "name": "/layers.5/mlp/up_proj/Linear", "outputIndexes": [ 3618 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3618 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3619 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3619 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 659 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 658, 659 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_5/Mul_output_0", "outputIndexes": [ 660 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 660 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3620 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3620 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3621 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3621 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 363164550, 12451862, 3112960, 0, 0 ] } , "name": "/layers.5/mlp/down_proj/Linear", "outputIndexes": [ 3622 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3622 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3623 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3623 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 661 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 655, 661 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_32_output_0", "outputIndexes": [ 662 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 662, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_54_output_0", "outputIndexes": [ 663 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 663 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 378729372, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_6/Mul_1_output_0", "outputIndexes": [ 664 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 664 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3624 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3624 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3625 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3625 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 378749852, 5242902, 1310720, 0, 0 ] } , "name": "/layers.6/self_attn/q_proj/Linear", "outputIndexes": [ 3626 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3626 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3627 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3627 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 665 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 664 ] , "main_type": "NONE", "name": "/Shape_84_output_0", "outputIndexes": [ 666 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 666 ] , "main_type": "NONE", "name": "Shape2549", "outputIndexes": [ 667 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 666 ] , "main_type": "NONE", "name": "Rank2551", "outputIndexes": [ 668 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 668, 668 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2553", "outputIndexes": [ 669 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 669 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2554", "outputIndexes": [ 670 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 669, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2556", "outputIndexes": [ 671 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 671 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2557", "outputIndexes": [ 672 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 667, 670, 672, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2560", "outputIndexes": [ 673 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 673 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2561", "outputIndexes": [ 674 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 674, 674 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2563", "outputIndexes": [ 675 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 666, 675, 669 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_96_output_0", "outputIndexes": [ 676 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 676, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_192_output_0", "outputIndexes": [ 677 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 669 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2571", "outputIndexes": [ 678 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 671 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2574", "outputIndexes": [ 679 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 667, 678, 679, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2577", "outputIndexes": [ 680 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 680 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2578", "outputIndexes": [ 681 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 681 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2579", "outputIndexes": [ 682 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 682, 681 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2580", "outputIndexes": [ 683 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 666, 683, 669 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_97_output_0", "outputIndexes": [ 684 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 684, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_193_output_0", "outputIndexes": [ 685 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 677, 685, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_78_output_0", "outputIndexes": [ 686 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 665, 686 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_55_output_0", "outputIndexes": [ 687 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 687 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 385303474, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_6/Mul_1_output_0", "outputIndexes": [ 689 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 689, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_48_output_0", "outputIndexes": [ 690 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 689 ] , "main_type": "NONE", "name": "/Shape_86_output_0", "outputIndexes": [ 691 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 691 ] , "main_type": "NONE", "name": "Shape2699", "outputIndexes": [ 692 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 691 ] , "main_type": "NONE", "name": "Rank2701", "outputIndexes": [ 693 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 693, 693 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2703", "outputIndexes": [ 694 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 694 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2704", "outputIndexes": [ 695 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 694, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2706", "outputIndexes": [ 696 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 696 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2707", "outputIndexes": [ 697 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 692, 695, 697, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2710", "outputIndexes": [ 698 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 698 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2711", "outputIndexes": [ 699 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 699 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2712", "outputIndexes": [ 700 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 700, 699 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2713", "outputIndexes": [ 701 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 691, 701, 694 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_98_output_0", "outputIndexes": [ 702 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 702, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_18_output_0", "outputIndexes": [ 703 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 703, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_199_output_0", "outputIndexes": [ 704 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 689, 704, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_25_output_0", "outputIndexes": [ 705 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 705 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_12_output_0", "outputIndexes": [ 706 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 703, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_198_output_0", "outputIndexes": [ 707 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 689, 22, 707, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_24_output_0", "outputIndexes": [ 708 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 706, 708 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_81_output_0", "outputIndexes": [ 709 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 709, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_49_output_0", "outputIndexes": [ 710 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 690, 710 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_33_output_0", "outputIndexes": [ 711 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3625 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 385304498, 1310742, 327680, 0, 0 ] } , "name": "/layers.6/self_attn/k_proj/Linear", "outputIndexes": [ 3630 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3630 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3631 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3631 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 712 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 676, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_194_output_0", "outputIndexes": [ 713 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 684, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_195_output_0", "outputIndexes": [ 714 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 713, 714, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_79_output_0", "outputIndexes": [ 715 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 712, 715 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_56_output_0", "outputIndexes": [ 716 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 716 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 386942920, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_6/Mul_1_output_0", "outputIndexes": [ 718 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 718, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_50_output_0", "outputIndexes": [ 719 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 718 ] , "main_type": "NONE", "name": "/Shape_87_output_0", "outputIndexes": [ 720 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 720 ] , "main_type": "NONE", "name": "Shape2595", "outputIndexes": [ 721 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 720 ] , "main_type": "NONE", "name": "Rank2597", "outputIndexes": [ 722 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 722, 722 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2599", "outputIndexes": [ 723 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 723 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2600", "outputIndexes": [ 724 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 723, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2602", "outputIndexes": [ 725 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 725 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2603", "outputIndexes": [ 726 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 721, 724, 726, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2606", "outputIndexes": [ 727 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 727 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2607", "outputIndexes": [ 728 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 728 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2608", "outputIndexes": [ 729 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 729, 728 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2609", "outputIndexes": [ 730 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 720, 730, 723 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_99_output_0", "outputIndexes": [ 731 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 731, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_19_output_0", "outputIndexes": [ 732 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 732, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_201_output_0", "outputIndexes": [ 733 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 718, 733, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_27_output_0", "outputIndexes": [ 734 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 734 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_13_output_0", "outputIndexes": [ 735 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 732, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_200_output_0", "outputIndexes": [ 736 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 718, 22, 736, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_26_output_0", "outputIndexes": [ 737 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 735, 737 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_82_output_0", "outputIndexes": [ 738 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 738, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_51_output_0", "outputIndexes": [ 739 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 719, 739 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_34_output_0", "outputIndexes": [ 740 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3625 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 386943944, 1310742, 327680, 0, 0 ] } , "name": "/layers.6/self_attn/v_proj/Linear", "outputIndexes": [ 3634 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3634 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3635 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3635 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 741 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 676, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_196_output_0", "outputIndexes": [ 742 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 684, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_197_output_0", "outputIndexes": [ 743 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 742, 743, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_80_output_0", "outputIndexes": [ 744 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 741, 744 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_57_output_0", "outputIndexes": [ 745 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 711, 740, 745, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_62_output_0", "outputIndexes": [ 746 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 746 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3636 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3636 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3637 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3637 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 388582366, 5242902, 1310720, 0, 0 ] } , "name": "/layers.6/self_attn/o_proj/Linear", "outputIndexes": [ 3638 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3638 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3639 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3639 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 747 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 663, 747 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_36_output_0", "outputIndexes": [ 748 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 748 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 395135988, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_6/Mul_1_output_0", "outputIndexes": [ 749 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 749 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3640 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3640 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3641 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3641 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 395156468, 12451862, 3112960, 0, 0 ] } , "name": "/layers.6/mlp/gate_proj/Linear", "outputIndexes": [ 3642 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3642 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3643 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3643 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 750 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 750 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_6/Mul_output_0", "outputIndexes": [ 751 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3641 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 410721290, 12451862, 3112960, 0, 0 ] } , "name": "/layers.6/mlp/up_proj/Linear", "outputIndexes": [ 3646 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3646 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3647 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3647 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 752 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 751, 752 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_6/Mul_output_0", "outputIndexes": [ 753 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 753 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3648 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3648 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3649 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3649 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 426286112, 12451862, 3112960, 0, 0 ] } , "name": "/layers.6/mlp/down_proj/Linear", "outputIndexes": [ 3650 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3650 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3651 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3651 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 754 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 748, 754 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_37_output_0", "outputIndexes": [ 755 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 755, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_63_output_0", "outputIndexes": [ 756 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 756 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 441850934, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_7/Mul_1_output_0", "outputIndexes": [ 757 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 757 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3652 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3652 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3653 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3653 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 441871414, 5242902, 1310720, 0, 0 ] } , "name": "/layers.7/self_attn/q_proj/Linear", "outputIndexes": [ 3654 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3654 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3655 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3655 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 758 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 757 ] , "main_type": "NONE", "name": "/Shape_98_output_0", "outputIndexes": [ 759 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 759 ] , "main_type": "NONE", "name": "Shape2938", "outputIndexes": [ 760 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 759 ] , "main_type": "NONE", "name": "Rank2940", "outputIndexes": [ 761 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 761, 761 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2942", "outputIndexes": [ 762 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 762 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2943", "outputIndexes": [ 763 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 762, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2945", "outputIndexes": [ 764 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2946", "outputIndexes": [ 765 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 760, 763, 765, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2949", "outputIndexes": [ 766 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 766 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2950", "outputIndexes": [ 767 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 767, 767 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2952", "outputIndexes": [ 768 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 759, 768, 762 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_111_output_0", "outputIndexes": [ 769 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 769, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_224_output_0", "outputIndexes": [ 770 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 762 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2960", "outputIndexes": [ 771 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2963", "outputIndexes": [ 772 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 760, 771, 772, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2966", "outputIndexes": [ 773 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 773 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2967", "outputIndexes": [ 774 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 774 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2968", "outputIndexes": [ 775 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 775, 774 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2969", "outputIndexes": [ 776 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 759, 776, 762 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_112_output_0", "outputIndexes": [ 777 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 777, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_225_output_0", "outputIndexes": [ 778 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 770, 778, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_91_output_0", "outputIndexes": [ 779 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 758, 779 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_64_output_0", "outputIndexes": [ 780 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 780 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 448425036, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_7/Mul_1_output_0", "outputIndexes": [ 782 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_56_output_0", "outputIndexes": [ 783 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782 ] , "main_type": "NONE", "name": "/Shape_100_output_0", "outputIndexes": [ 784 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 784 ] , "main_type": "NONE", "name": "Shape3088", "outputIndexes": [ 785 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 784 ] , "main_type": "NONE", "name": "Rank3090", "outputIndexes": [ 786 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 786, 786 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3092", "outputIndexes": [ 787 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 787 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3093", "outputIndexes": [ 788 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 787, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3095", "outputIndexes": [ 789 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 789 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3096", "outputIndexes": [ 790 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 785, 788, 790, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3099", "outputIndexes": [ 791 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 791 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3100", "outputIndexes": [ 792 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 792 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3101", "outputIndexes": [ 793 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 793, 792 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3102", "outputIndexes": [ 794 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 784, 794, 787 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_113_output_0", "outputIndexes": [ 795 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 795, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_21_output_0", "outputIndexes": [ 796 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 796, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_231_output_0", "outputIndexes": [ 797 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 797, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_29_output_0", "outputIndexes": [ 798 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 798 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_14_output_0", "outputIndexes": [ 799 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 796, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_230_output_0", "outputIndexes": [ 800 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 22, 800, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_28_output_0", "outputIndexes": [ 801 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 799, 801 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_94_output_0", "outputIndexes": [ 802 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 802, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_57_output_0", "outputIndexes": [ 803 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 783, 803 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_38_output_0", "outputIndexes": [ 804 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3653 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 448426060, 1310742, 327680, 0, 0 ] } , "name": "/layers.7/self_attn/k_proj/Linear", "outputIndexes": [ 3658 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3658 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3659 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3659 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 805 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 769, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_226_output_0", "outputIndexes": [ 806 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 777, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_227_output_0", "outputIndexes": [ 807 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 806, 807, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_92_output_0", "outputIndexes": [ 808 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 805, 808 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_65_output_0", "outputIndexes": [ 809 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 450064482, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_7/Mul_1_output_0", "outputIndexes": [ 811 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_58_output_0", "outputIndexes": [ 812 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811 ] , "main_type": "NONE", "name": "/Shape_101_output_0", "outputIndexes": [ 813 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 813 ] , "main_type": "NONE", "name": "Shape2984", "outputIndexes": [ 814 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 813 ] , "main_type": "NONE", "name": "Rank2986", "outputIndexes": [ 815 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 815, 815 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2988", "outputIndexes": [ 816 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2989", "outputIndexes": [ 817 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2991", "outputIndexes": [ 818 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 818 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2992", "outputIndexes": [ 819 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 814, 817, 819, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2995", "outputIndexes": [ 820 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 820 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2996", "outputIndexes": [ 821 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 821 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2997", "outputIndexes": [ 822 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 822, 821 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2998", "outputIndexes": [ 823 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 813, 823, 816 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_114_output_0", "outputIndexes": [ 824 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 824, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_22_output_0", "outputIndexes": [ 825 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 825, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_233_output_0", "outputIndexes": [ 826 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 826, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_31_output_0", "outputIndexes": [ 827 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 827 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_15_output_0", "outputIndexes": [ 828 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 825, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_232_output_0", "outputIndexes": [ 829 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 22, 829, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_30_output_0", "outputIndexes": [ 830 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 828, 830 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_95_output_0", "outputIndexes": [ 831 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 831, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_59_output_0", "outputIndexes": [ 832 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 812, 832 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_39_output_0", "outputIndexes": [ 833 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3653 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 450065506, 1310742, 327680, 0, 0 ] } , "name": "/layers.7/self_attn/v_proj/Linear", "outputIndexes": [ 3662 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3662 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3663 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3663 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 834 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 769, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_228_output_0", "outputIndexes": [ 835 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 777, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_229_output_0", "outputIndexes": [ 836 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 835, 836, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_93_output_0", "outputIndexes": [ 837 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 834, 837 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_66_output_0", "outputIndexes": [ 838 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 804, 833, 838, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_71_output_0", "outputIndexes": [ 839 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 839 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3664 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3664 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3665 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3665 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 451703928, 5242902, 1310720, 0, 0 ] } , "name": "/layers.7/self_attn/o_proj/Linear", "outputIndexes": [ 3666 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3666 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3667 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3667 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 840 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 756, 840 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_41_output_0", "outputIndexes": [ 841 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 841 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 458257550, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_7/Mul_1_output_0", "outputIndexes": [ 842 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 842 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3668 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3668 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3669 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3669 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 458278030, 12451862, 3112960, 0, 0 ] } , "name": "/layers.7/mlp/gate_proj/Linear", "outputIndexes": [ 3670 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3670 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3671 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3671 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 843 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 843 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_7/Mul_output_0", "outputIndexes": [ 844 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3669 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 473842852, 12451862, 3112960, 0, 0 ] } , "name": "/layers.7/mlp/up_proj/Linear", "outputIndexes": [ 3674 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3674 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3675 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3675 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 845 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 844, 845 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_7/Mul_output_0", "outputIndexes": [ 846 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 846 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3676 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3676 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3677 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3677 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 489407674, 12451862, 3112960, 0, 0 ] } , "name": "/layers.7/mlp/down_proj/Linear", "outputIndexes": [ 3678 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3678 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3679 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3679 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 847 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 841, 847 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_42_output_0", "outputIndexes": [ 848 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 848, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_72_output_0", "outputIndexes": [ 849 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 849 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 504972496, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_8/Mul_1_output_0", "outputIndexes": [ 850 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3680 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3680 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3681 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3681 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 504992976, 5242902, 1310720, 0, 0 ] } , "name": "/layers.8/self_attn/q_proj/Linear", "outputIndexes": [ 3682 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3682 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3683 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3683 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 851 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850 ] , "main_type": "NONE", "name": "/Shape_112_output_0", "outputIndexes": [ 852 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 852 ] , "main_type": "NONE", "name": "Shape3327", "outputIndexes": [ 853 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 852 ] , "main_type": "NONE", "name": "Rank3329", "outputIndexes": [ 854 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 854, 854 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3331", "outputIndexes": [ 855 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 855 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3332", "outputIndexes": [ 856 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 855, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3334", "outputIndexes": [ 857 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 857 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3335", "outputIndexes": [ 858 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 853, 856, 858, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3338", "outputIndexes": [ 859 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 859 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3339", "outputIndexes": [ 860 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 860, 860 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3341", "outputIndexes": [ 861 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 852, 861, 855 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_126_output_0", "outputIndexes": [ 862 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 862, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_256_output_0", "outputIndexes": [ 863 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 855 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3349", "outputIndexes": [ 864 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 857 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3352", "outputIndexes": [ 865 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 853, 864, 865, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3355", "outputIndexes": [ 866 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 866 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3356", "outputIndexes": [ 867 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 867 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3357", "outputIndexes": [ 868 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 868, 867 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3358", "outputIndexes": [ 869 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 852, 869, 855 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_127_output_0", "outputIndexes": [ 870 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 870, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_257_output_0", "outputIndexes": [ 871 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 863, 871, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_104_output_0", "outputIndexes": [ 872 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 851, 872 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_73_output_0", "outputIndexes": [ 873 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 873 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 511546598, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_8/Mul_1_output_0", "outputIndexes": [ 875 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 875, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_64_output_0", "outputIndexes": [ 876 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 875 ] , "main_type": "NONE", "name": "/Shape_114_output_0", "outputIndexes": [ 877 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 877 ] , "main_type": "NONE", "name": "Shape3477", "outputIndexes": [ 878 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 877 ] , "main_type": "NONE", "name": "Rank3479", "outputIndexes": [ 879 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 879, 879 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3481", "outputIndexes": [ 880 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 880 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3482", "outputIndexes": [ 881 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 880, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3484", "outputIndexes": [ 882 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 882 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3485", "outputIndexes": [ 883 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 878, 881, 883, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3488", "outputIndexes": [ 884 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 884 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3489", "outputIndexes": [ 885 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 885 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3490", "outputIndexes": [ 886 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 886, 885 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3491", "outputIndexes": [ 887 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 877, 887, 880 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_128_output_0", "outputIndexes": [ 888 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 888, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_24_output_0", "outputIndexes": [ 889 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 889, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_263_output_0", "outputIndexes": [ 890 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 875, 890, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_33_output_0", "outputIndexes": [ 891 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 891 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_16_output_0", "outputIndexes": [ 892 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 889, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_262_output_0", "outputIndexes": [ 893 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 875, 22, 893, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_32_output_0", "outputIndexes": [ 894 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 892, 894 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_107_output_0", "outputIndexes": [ 895 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 895, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_65_output_0", "outputIndexes": [ 896 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 876, 896 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_43_output_0", "outputIndexes": [ 897 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3681 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 511547622, 1310742, 327680, 0, 0 ] } , "name": "/layers.8/self_attn/k_proj/Linear", "outputIndexes": [ 3686 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3686 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3687 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3687 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 898 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 862, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_258_output_0", "outputIndexes": [ 899 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 870, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_259_output_0", "outputIndexes": [ 900 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 899, 900, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_105_output_0", "outputIndexes": [ 901 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898, 901 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_74_output_0", "outputIndexes": [ 902 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 902 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 513186044, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_8/Mul_1_output_0", "outputIndexes": [ 904 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 904, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_66_output_0", "outputIndexes": [ 905 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 904 ] , "main_type": "NONE", "name": "/Shape_115_output_0", "outputIndexes": [ 906 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 906 ] , "main_type": "NONE", "name": "Shape3373", "outputIndexes": [ 907 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 906 ] , "main_type": "NONE", "name": "Rank3375", "outputIndexes": [ 908 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 908, 908 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3377", "outputIndexes": [ 909 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 909 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3378", "outputIndexes": [ 910 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 909, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3380", "outputIndexes": [ 911 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 911 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3381", "outputIndexes": [ 912 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 907, 910, 912, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3384", "outputIndexes": [ 913 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 913 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3385", "outputIndexes": [ 914 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 914 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3386", "outputIndexes": [ 915 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 915, 914 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3387", "outputIndexes": [ 916 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 906, 916, 909 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_129_output_0", "outputIndexes": [ 917 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 917, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_25_output_0", "outputIndexes": [ 918 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 918, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_265_output_0", "outputIndexes": [ 919 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 904, 919, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_35_output_0", "outputIndexes": [ 920 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 920 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_17_output_0", "outputIndexes": [ 921 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 918, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_264_output_0", "outputIndexes": [ 922 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 904, 22, 922, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_34_output_0", "outputIndexes": [ 923 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 921, 923 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_108_output_0", "outputIndexes": [ 924 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 924, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_67_output_0", "outputIndexes": [ 925 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 905, 925 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_44_output_0", "outputIndexes": [ 926 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3681 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 513187068, 1310742, 327680, 0, 0 ] } , "name": "/layers.8/self_attn/v_proj/Linear", "outputIndexes": [ 3690 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3690 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3691 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3691 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 927 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 862, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_260_output_0", "outputIndexes": [ 928 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 870, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_261_output_0", "outputIndexes": [ 929 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 928, 929, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_106_output_0", "outputIndexes": [ 930 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 927, 930 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_75_output_0", "outputIndexes": [ 931 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 897, 926, 931, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_80_output_0", "outputIndexes": [ 932 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 932 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3692 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3692 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3693 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3693 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 514825490, 5242902, 1310720, 0, 0 ] } , "name": "/layers.8/self_attn/o_proj/Linear", "outputIndexes": [ 3694 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3694 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3695 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3695 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 933 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 849, 933 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_46_output_0", "outputIndexes": [ 934 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 934 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 521379112, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_8/Mul_1_output_0", "outputIndexes": [ 935 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 935 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3696 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3696 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3697 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3697 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 521399592, 12451862, 3112960, 0, 0 ] } , "name": "/layers.8/mlp/gate_proj/Linear", "outputIndexes": [ 3698 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3698 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3699 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3699 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 936 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 936 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_8/Mul_output_0", "outputIndexes": [ 937 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3697 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 536964414, 12451862, 3112960, 0, 0 ] } , "name": "/layers.8/mlp/up_proj/Linear", "outputIndexes": [ 3702 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3702 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3703 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3703 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 938 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 937, 938 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_8/Mul_output_0", "outputIndexes": [ 939 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 939 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3704 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3704 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3705 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3705 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 552529236, 12451862, 3112960, 0, 0 ] } , "name": "/layers.8/mlp/down_proj/Linear", "outputIndexes": [ 3706 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3706 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3707 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3707 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 940 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 934, 940 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_47_output_0", "outputIndexes": [ 941 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 941, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_81_output_0", "outputIndexes": [ 942 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 568094058, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_9/Mul_1_output_0", "outputIndexes": [ 943 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 943 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3708 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3708 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3709 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3709 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 568114538, 5242902, 1310720, 0, 0 ] } , "name": "/layers.9/self_attn/q_proj/Linear", "outputIndexes": [ 3710 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3710 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3711 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3711 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 944 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 943 ] , "main_type": "NONE", "name": "/Shape_126_output_0", "outputIndexes": [ 945 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 945 ] , "main_type": "NONE", "name": "Shape3716", "outputIndexes": [ 946 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 945 ] , "main_type": "NONE", "name": "Rank3718", "outputIndexes": [ 947 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 947, 947 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3720", "outputIndexes": [ 948 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 948 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3721", "outputIndexes": [ 949 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 948, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3723", "outputIndexes": [ 950 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 950 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3724", "outputIndexes": [ 951 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 946, 949, 951, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3727", "outputIndexes": [ 952 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 952 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3728", "outputIndexes": [ 953 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 953, 953 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3730", "outputIndexes": [ 954 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 945, 954, 948 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_141_output_0", "outputIndexes": [ 955 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 955, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_288_output_0", "outputIndexes": [ 956 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 948 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3738", "outputIndexes": [ 957 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 950 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3741", "outputIndexes": [ 958 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 946, 957, 958, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3744", "outputIndexes": [ 959 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 959 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3745", "outputIndexes": [ 960 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 960 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3746", "outputIndexes": [ 961 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 961, 960 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3747", "outputIndexes": [ 962 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 945, 962, 948 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_142_output_0", "outputIndexes": [ 963 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 963, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_289_output_0", "outputIndexes": [ 964 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 956, 964, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_117_output_0", "outputIndexes": [ 965 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 944, 965 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_82_output_0", "outputIndexes": [ 966 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 966 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 574668160, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_9/Mul_1_output_0", "outputIndexes": [ 968 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 968, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_72_output_0", "outputIndexes": [ 969 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 968 ] , "main_type": "NONE", "name": "/Shape_128_output_0", "outputIndexes": [ 970 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 970 ] , "main_type": "NONE", "name": "Shape3866", "outputIndexes": [ 971 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 970 ] , "main_type": "NONE", "name": "Rank3868", "outputIndexes": [ 972 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 972, 972 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3870", "outputIndexes": [ 973 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 973 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3871", "outputIndexes": [ 974 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 973, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3873", "outputIndexes": [ 975 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 975 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3874", "outputIndexes": [ 976 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 971, 974, 976, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3877", "outputIndexes": [ 977 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 977 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3878", "outputIndexes": [ 978 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 978 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3879", "outputIndexes": [ 979 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 979, 978 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3880", "outputIndexes": [ 980 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 970, 980, 973 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_143_output_0", "outputIndexes": [ 981 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 981, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_27_output_0", "outputIndexes": [ 982 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 982, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_295_output_0", "outputIndexes": [ 983 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 968, 983, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_37_output_0", "outputIndexes": [ 984 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 984 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_18_output_0", "outputIndexes": [ 985 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 982, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_294_output_0", "outputIndexes": [ 986 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 968, 22, 986, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_36_output_0", "outputIndexes": [ 987 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 985, 987 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_120_output_0", "outputIndexes": [ 988 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 988, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_73_output_0", "outputIndexes": [ 989 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 969, 989 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_48_output_0", "outputIndexes": [ 990 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3709 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 574669184, 1310742, 327680, 0, 0 ] } , "name": "/layers.9/self_attn/k_proj/Linear", "outputIndexes": [ 3714 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3714 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3715 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3715 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 991 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 955, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_290_output_0", "outputIndexes": [ 992 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 963, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_291_output_0", "outputIndexes": [ 993 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 992, 993, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_118_output_0", "outputIndexes": [ 994 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 991, 994 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_83_output_0", "outputIndexes": [ 995 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 995 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 576307606, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_9/Mul_1_output_0", "outputIndexes": [ 997 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 997, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_74_output_0", "outputIndexes": [ 998 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 997 ] , "main_type": "NONE", "name": "/Shape_129_output_0", "outputIndexes": [ 999 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 999 ] , "main_type": "NONE", "name": "Shape3762", "outputIndexes": [ 1000 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 999 ] , "main_type": "NONE", "name": "Rank3764", "outputIndexes": [ 1001 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1001, 1001 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3766", "outputIndexes": [ 1002 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1002 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3767", "outputIndexes": [ 1003 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1002, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3769", "outputIndexes": [ 1004 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1004 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3770", "outputIndexes": [ 1005 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1000, 1003, 1005, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3773", "outputIndexes": [ 1006 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1006 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3774", "outputIndexes": [ 1007 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1007 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3775", "outputIndexes": [ 1008 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1008, 1007 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3776", "outputIndexes": [ 1009 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 999, 1009, 1002 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_144_output_0", "outputIndexes": [ 1010 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1010, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_28_output_0", "outputIndexes": [ 1011 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1011, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_297_output_0", "outputIndexes": [ 1012 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 997, 1012, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_39_output_0", "outputIndexes": [ 1013 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1013 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_19_output_0", "outputIndexes": [ 1014 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1011, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_296_output_0", "outputIndexes": [ 1015 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 997, 22, 1015, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_38_output_0", "outputIndexes": [ 1016 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1014, 1016 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_121_output_0", "outputIndexes": [ 1017 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1017, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_75_output_0", "outputIndexes": [ 1018 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 998, 1018 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_49_output_0", "outputIndexes": [ 1019 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3709 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 576308630, 1310742, 327680, 0, 0 ] } , "name": "/layers.9/self_attn/v_proj/Linear", "outputIndexes": [ 3718 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3718 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3719 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3719 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1020 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 955, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_292_output_0", "outputIndexes": [ 1021 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 963, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_293_output_0", "outputIndexes": [ 1022 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1021, 1022, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_119_output_0", "outputIndexes": [ 1023 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1020, 1023 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_84_output_0", "outputIndexes": [ 1024 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 990, 1019, 1024, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_89_output_0", "outputIndexes": [ 1025 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1025 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3720 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3720 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3721 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3721 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 577947052, 5242902, 1310720, 0, 0 ] } , "name": "/layers.9/self_attn/o_proj/Linear", "outputIndexes": [ 3722 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3722 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3723 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3723 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1026 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942, 1026 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_51_output_0", "outputIndexes": [ 1027 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1027 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 584500674, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_9/Mul_1_output_0", "outputIndexes": [ 1028 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1028 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3724 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3724 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3725 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3725 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 584521154, 12451862, 3112960, 0, 0 ] } , "name": "/layers.9/mlp/gate_proj/Linear", "outputIndexes": [ 3726 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3726 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3727 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3727 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1029 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1029 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_9/Mul_output_0", "outputIndexes": [ 1030 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3725 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 600085976, 12451862, 3112960, 0, 0 ] } , "name": "/layers.9/mlp/up_proj/Linear", "outputIndexes": [ 3730 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3730 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3731 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3731 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1031 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1030, 1031 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_9/Mul_output_0", "outputIndexes": [ 1032 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1032 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3732 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3732 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3733 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3733 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 615650798, 12451862, 3112960, 0, 0 ] } , "name": "/layers.9/mlp/down_proj/Linear", "outputIndexes": [ 3734 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3734 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3735 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3735 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1033 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1027, 1033 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_52_output_0", "outputIndexes": [ 1034 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1034, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_90_output_0", "outputIndexes": [ 1035 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1035 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 631215620, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_10/Mul_1_output_0", "outputIndexes": [ 1036 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1036 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3736 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3736 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3737 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3737 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 631236100, 5242902, 1310720, 0, 0 ] } , "name": "/layers.10/self_attn/q_proj/Linear", "outputIndexes": [ 3738 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3738 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3739 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3739 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1037 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1036 ] , "main_type": "NONE", "name": "/Shape_140_output_0", "outputIndexes": [ 1038 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1038 ] , "main_type": "NONE", "name": "Shape4105", "outputIndexes": [ 1039 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1038 ] , "main_type": "NONE", "name": "Rank4107", "outputIndexes": [ 1040 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1040, 1040 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4109", "outputIndexes": [ 1041 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1041 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4110", "outputIndexes": [ 1042 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1041, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4112", "outputIndexes": [ 1043 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1043 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4113", "outputIndexes": [ 1044 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1039, 1042, 1044, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4116", "outputIndexes": [ 1045 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1045 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4117", "outputIndexes": [ 1046 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1046, 1046 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4119", "outputIndexes": [ 1047 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1038, 1047, 1041 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_156_output_0", "outputIndexes": [ 1048 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1048, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_320_output_0", "outputIndexes": [ 1049 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1041 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4127", "outputIndexes": [ 1050 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1043 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4130", "outputIndexes": [ 1051 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1039, 1050, 1051, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4133", "outputIndexes": [ 1052 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1052 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4134", "outputIndexes": [ 1053 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1053 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4135", "outputIndexes": [ 1054 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1054, 1053 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4136", "outputIndexes": [ 1055 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1038, 1055, 1041 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_157_output_0", "outputIndexes": [ 1056 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1056, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_321_output_0", "outputIndexes": [ 1057 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1049, 1057, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_130_output_0", "outputIndexes": [ 1058 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1037, 1058 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_91_output_0", "outputIndexes": [ 1059 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1059 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 637789722, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_10/Mul_1_output_0", "outputIndexes": [ 1061 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1061, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_80_output_0", "outputIndexes": [ 1062 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1061 ] , "main_type": "NONE", "name": "/Shape_142_output_0", "outputIndexes": [ 1063 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1063 ] , "main_type": "NONE", "name": "Shape4255", "outputIndexes": [ 1064 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1063 ] , "main_type": "NONE", "name": "Rank4257", "outputIndexes": [ 1065 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1065, 1065 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4259", "outputIndexes": [ 1066 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1066 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4260", "outputIndexes": [ 1067 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1066, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4262", "outputIndexes": [ 1068 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1068 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4263", "outputIndexes": [ 1069 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1064, 1067, 1069, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4266", "outputIndexes": [ 1070 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1070 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4267", "outputIndexes": [ 1071 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1071 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4268", "outputIndexes": [ 1072 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1072, 1071 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4269", "outputIndexes": [ 1073 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1063, 1073, 1066 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_158_output_0", "outputIndexes": [ 1074 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1074, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_30_output_0", "outputIndexes": [ 1075 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1075, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_327_output_0", "outputIndexes": [ 1076 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1061, 1076, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_41_output_0", "outputIndexes": [ 1077 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1077 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_20_output_0", "outputIndexes": [ 1078 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1075, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_326_output_0", "outputIndexes": [ 1079 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1061, 22, 1079, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_40_output_0", "outputIndexes": [ 1080 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1078, 1080 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_133_output_0", "outputIndexes": [ 1081 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1081, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_81_output_0", "outputIndexes": [ 1082 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1062, 1082 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_53_output_0", "outputIndexes": [ 1083 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3737 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 637790746, 1310742, 327680, 0, 0 ] } , "name": "/layers.10/self_attn/k_proj/Linear", "outputIndexes": [ 3742 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3742 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3743 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3743 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1084 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1048, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_322_output_0", "outputIndexes": [ 1085 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1056, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_323_output_0", "outputIndexes": [ 1086 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1085, 1086, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_131_output_0", "outputIndexes": [ 1087 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1084, 1087 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_92_output_0", "outputIndexes": [ 1088 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1088 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 639429168, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_10/Mul_1_output_0", "outputIndexes": [ 1090 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_82_output_0", "outputIndexes": [ 1091 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090 ] , "main_type": "NONE", "name": "/Shape_143_output_0", "outputIndexes": [ 1092 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1092 ] , "main_type": "NONE", "name": "Shape4151", "outputIndexes": [ 1093 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1092 ] , "main_type": "NONE", "name": "Rank4153", "outputIndexes": [ 1094 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1094, 1094 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4155", "outputIndexes": [ 1095 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1095 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4156", "outputIndexes": [ 1096 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1095, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4158", "outputIndexes": [ 1097 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1097 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4159", "outputIndexes": [ 1098 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1093, 1096, 1098, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4162", "outputIndexes": [ 1099 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1099 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4163", "outputIndexes": [ 1100 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1100 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4164", "outputIndexes": [ 1101 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1101, 1100 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4165", "outputIndexes": [ 1102 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1092, 1102, 1095 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_159_output_0", "outputIndexes": [ 1103 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1103, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_31_output_0", "outputIndexes": [ 1104 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1104, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_329_output_0", "outputIndexes": [ 1105 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090, 1105, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_43_output_0", "outputIndexes": [ 1106 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1106 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_21_output_0", "outputIndexes": [ 1107 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1104, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_328_output_0", "outputIndexes": [ 1108 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090, 22, 1108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_42_output_0", "outputIndexes": [ 1109 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1107, 1109 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_134_output_0", "outputIndexes": [ 1110 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1110, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_83_output_0", "outputIndexes": [ 1111 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1091, 1111 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_54_output_0", "outputIndexes": [ 1112 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3737 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 639430192, 1310742, 327680, 0, 0 ] } , "name": "/layers.10/self_attn/v_proj/Linear", "outputIndexes": [ 3746 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3746 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3747 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3747 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1113 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1048, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_324_output_0", "outputIndexes": [ 1114 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1056, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_325_output_0", "outputIndexes": [ 1115 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1114, 1115, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_132_output_0", "outputIndexes": [ 1116 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1113, 1116 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_93_output_0", "outputIndexes": [ 1117 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1083, 1112, 1117, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_98_output_0", "outputIndexes": [ 1118 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1118 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3748 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3748 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3749 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3749 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 641068614, 5242902, 1310720, 0, 0 ] } , "name": "/layers.10/self_attn/o_proj/Linear", "outputIndexes": [ 3750 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3750 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3751 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3751 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1119 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1035, 1119 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_56_output_0", "outputIndexes": [ 1120 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1120 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 647622236, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_10/Mul_1_output_0", "outputIndexes": [ 1121 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1121 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3752 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3752 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3753 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3753 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 647642716, 12451862, 3112960, 0, 0 ] } , "name": "/layers.10/mlp/gate_proj/Linear", "outputIndexes": [ 3754 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3754 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3755 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3755 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1122 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1122 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_10/Mul_output_0", "outputIndexes": [ 1123 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3753 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 663207538, 12451862, 3112960, 0, 0 ] } , "name": "/layers.10/mlp/up_proj/Linear", "outputIndexes": [ 3758 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3758 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3759 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3759 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1124 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1123, 1124 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_10/Mul_output_0", "outputIndexes": [ 1125 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1125 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3760 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3760 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3761 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3761 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 678772360, 12451862, 3112960, 0, 0 ] } , "name": "/layers.10/mlp/down_proj/Linear", "outputIndexes": [ 3762 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3762 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3763 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3763 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1126 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1120, 1126 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_57_output_0", "outputIndexes": [ 1127 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1127, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_99_output_0", "outputIndexes": [ 1128 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1128 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 694337182, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_11/Mul_1_output_0", "outputIndexes": [ 1129 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1129 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3764 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3764 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3765 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3765 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 694357662, 5242902, 1310720, 0, 0 ] } , "name": "/layers.11/self_attn/q_proj/Linear", "outputIndexes": [ 3766 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3766 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3767 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3767 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1130 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1129 ] , "main_type": "NONE", "name": "/Shape_154_output_0", "outputIndexes": [ 1131 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1131 ] , "main_type": "NONE", "name": "Shape4494", "outputIndexes": [ 1132 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1131 ] , "main_type": "NONE", "name": "Rank4496", "outputIndexes": [ 1133 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1133, 1133 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4498", "outputIndexes": [ 1134 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1134 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4499", "outputIndexes": [ 1135 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1134, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4501", "outputIndexes": [ 1136 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1136 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4502", "outputIndexes": [ 1137 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1132, 1135, 1137, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4505", "outputIndexes": [ 1138 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4506", "outputIndexes": [ 1139 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1139, 1139 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4508", "outputIndexes": [ 1140 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1131, 1140, 1134 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_171_output_0", "outputIndexes": [ 1141 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1141, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_352_output_0", "outputIndexes": [ 1142 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1134 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4516", "outputIndexes": [ 1143 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1136 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4519", "outputIndexes": [ 1144 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1132, 1143, 1144, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4522", "outputIndexes": [ 1145 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1145 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4523", "outputIndexes": [ 1146 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1146 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4524", "outputIndexes": [ 1147 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1147, 1146 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4525", "outputIndexes": [ 1148 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1131, 1148, 1134 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_172_output_0", "outputIndexes": [ 1149 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1149, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_353_output_0", "outputIndexes": [ 1150 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1142, 1150, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_143_output_0", "outputIndexes": [ 1151 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1130, 1151 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_100_output_0", "outputIndexes": [ 1152 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1152 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 700911284, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_11/Mul_1_output_0", "outputIndexes": [ 1154 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_88_output_0", "outputIndexes": [ 1155 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154 ] , "main_type": "NONE", "name": "/Shape_156_output_0", "outputIndexes": [ 1156 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1156 ] , "main_type": "NONE", "name": "Shape4644", "outputIndexes": [ 1157 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1156 ] , "main_type": "NONE", "name": "Rank4646", "outputIndexes": [ 1158 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1158, 1158 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4648", "outputIndexes": [ 1159 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1159 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4649", "outputIndexes": [ 1160 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1159, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4651", "outputIndexes": [ 1161 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1161 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4652", "outputIndexes": [ 1162 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1157, 1160, 1162, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4655", "outputIndexes": [ 1163 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1163 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4656", "outputIndexes": [ 1164 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1164 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4657", "outputIndexes": [ 1165 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 1164 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4658", "outputIndexes": [ 1166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1156, 1166, 1159 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_173_output_0", "outputIndexes": [ 1167 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1167, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_33_output_0", "outputIndexes": [ 1168 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1168, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_359_output_0", "outputIndexes": [ 1169 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154, 1169, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_45_output_0", "outputIndexes": [ 1170 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1170 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_22_output_0", "outputIndexes": [ 1171 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1168, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_358_output_0", "outputIndexes": [ 1172 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154, 22, 1172, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_44_output_0", "outputIndexes": [ 1173 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1171, 1173 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_146_output_0", "outputIndexes": [ 1174 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1174, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_89_output_0", "outputIndexes": [ 1175 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1155, 1175 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_58_output_0", "outputIndexes": [ 1176 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3765 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 700912308, 1310742, 327680, 0, 0 ] } , "name": "/layers.11/self_attn/k_proj/Linear", "outputIndexes": [ 3770 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3770 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3771 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3771 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1177 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1141, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_354_output_0", "outputIndexes": [ 1178 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1149, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_355_output_0", "outputIndexes": [ 1179 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1178, 1179, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_144_output_0", "outputIndexes": [ 1180 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1177, 1180 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_101_output_0", "outputIndexes": [ 1181 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1181 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 702550730, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_11/Mul_1_output_0", "outputIndexes": [ 1183 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1183, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_90_output_0", "outputIndexes": [ 1184 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1183 ] , "main_type": "NONE", "name": "/Shape_157_output_0", "outputIndexes": [ 1185 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1185 ] , "main_type": "NONE", "name": "Shape4540", "outputIndexes": [ 1186 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1185 ] , "main_type": "NONE", "name": "Rank4542", "outputIndexes": [ 1187 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1187, 1187 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4544", "outputIndexes": [ 1188 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1188 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4545", "outputIndexes": [ 1189 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1188, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4547", "outputIndexes": [ 1190 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1190 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4548", "outputIndexes": [ 1191 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1186, 1189, 1191, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4551", "outputIndexes": [ 1192 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1192 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4552", "outputIndexes": [ 1193 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1193 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4553", "outputIndexes": [ 1194 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1194, 1193 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4554", "outputIndexes": [ 1195 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1185, 1195, 1188 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_174_output_0", "outputIndexes": [ 1196 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1196, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_34_output_0", "outputIndexes": [ 1197 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1197, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_361_output_0", "outputIndexes": [ 1198 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1183, 1198, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_47_output_0", "outputIndexes": [ 1199 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1199 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_23_output_0", "outputIndexes": [ 1200 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1197, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_360_output_0", "outputIndexes": [ 1201 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1183, 22, 1201, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_46_output_0", "outputIndexes": [ 1202 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1200, 1202 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_147_output_0", "outputIndexes": [ 1203 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1203, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_91_output_0", "outputIndexes": [ 1204 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1184, 1204 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_59_output_0", "outputIndexes": [ 1205 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3765 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 702551754, 1310742, 327680, 0, 0 ] } , "name": "/layers.11/self_attn/v_proj/Linear", "outputIndexes": [ 3774 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3774 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3775 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3775 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1206 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1141, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_356_output_0", "outputIndexes": [ 1207 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1149, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_357_output_0", "outputIndexes": [ 1208 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1207, 1208, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_145_output_0", "outputIndexes": [ 1209 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1206, 1209 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_102_output_0", "outputIndexes": [ 1210 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1176, 1205, 1210, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_107_output_0", "outputIndexes": [ 1211 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3776 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3776 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3777 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3777 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 704190176, 5242902, 1310720, 0, 0 ] } , "name": "/layers.11/self_attn/o_proj/Linear", "outputIndexes": [ 3778 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3778 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3779 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3779 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1212 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1128, 1212 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_61_output_0", "outputIndexes": [ 1213 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1213 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 710743798, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_11/Mul_1_output_0", "outputIndexes": [ 1214 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1214 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3780 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3780 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3781 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3781 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 710764278, 12451862, 3112960, 0, 0 ] } , "name": "/layers.11/mlp/gate_proj/Linear", "outputIndexes": [ 3782 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3782 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3783 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3783 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1215 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1215 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_11/Mul_output_0", "outputIndexes": [ 1216 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3781 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 726329100, 12451862, 3112960, 0, 0 ] } , "name": "/layers.11/mlp/up_proj/Linear", "outputIndexes": [ 3786 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3786 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3787 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3787 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1217 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 1217 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_11/Mul_output_0", "outputIndexes": [ 1218 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1218 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3788 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3788 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3789 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3789 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 741893922, 12451862, 3112960, 0, 0 ] } , "name": "/layers.11/mlp/down_proj/Linear", "outputIndexes": [ 3790 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3790 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3791 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3791 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1219 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1213, 1219 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_62_output_0", "outputIndexes": [ 1220 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1220, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_108_output_0", "outputIndexes": [ 1221 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1221 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 757458744, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_12/Mul_1_output_0", "outputIndexes": [ 1222 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1222 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3792 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3792 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3793 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3793 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 757479224, 5242902, 1310720, 0, 0 ] } , "name": "/layers.12/self_attn/q_proj/Linear", "outputIndexes": [ 3794 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3794 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3795 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3795 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1223 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1222 ] , "main_type": "NONE", "name": "/Shape_168_output_0", "outputIndexes": [ 1224 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1224 ] , "main_type": "NONE", "name": "Shape4883", "outputIndexes": [ 1225 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1224 ] , "main_type": "NONE", "name": "Rank4885", "outputIndexes": [ 1226 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1226, 1226 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4887", "outputIndexes": [ 1227 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4888", "outputIndexes": [ 1228 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4890", "outputIndexes": [ 1229 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4891", "outputIndexes": [ 1230 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1225, 1228, 1230, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4894", "outputIndexes": [ 1231 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1231 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4895", "outputIndexes": [ 1232 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1232, 1232 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4897", "outputIndexes": [ 1233 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 1233, 1227 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_186_output_0", "outputIndexes": [ 1234 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1234, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_384_output_0", "outputIndexes": [ 1235 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4905", "outputIndexes": [ 1236 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4908", "outputIndexes": [ 1237 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1225, 1236, 1237, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4911", "outputIndexes": [ 1238 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1238 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4912", "outputIndexes": [ 1239 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1239 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4913", "outputIndexes": [ 1240 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1240, 1239 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4914", "outputIndexes": [ 1241 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 1241, 1227 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_187_output_0", "outputIndexes": [ 1242 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1242, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_385_output_0", "outputIndexes": [ 1243 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1235, 1243, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_156_output_0", "outputIndexes": [ 1244 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1223, 1244 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_109_output_0", "outputIndexes": [ 1245 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1245 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 764032846, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_12/Mul_1_output_0", "outputIndexes": [ 1247 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1247, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_96_output_0", "outputIndexes": [ 1248 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1247 ] , "main_type": "NONE", "name": "/Shape_170_output_0", "outputIndexes": [ 1249 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1249 ] , "main_type": "NONE", "name": "Shape5033", "outputIndexes": [ 1250 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1249 ] , "main_type": "NONE", "name": "Rank5035", "outputIndexes": [ 1251 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1251, 1251 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5037", "outputIndexes": [ 1252 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1252 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5038", "outputIndexes": [ 1253 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1252, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5040", "outputIndexes": [ 1254 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1254 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5041", "outputIndexes": [ 1255 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1250, 1253, 1255, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5044", "outputIndexes": [ 1256 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1256 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5045", "outputIndexes": [ 1257 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1257 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5046", "outputIndexes": [ 1258 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1258, 1257 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5047", "outputIndexes": [ 1259 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1249, 1259, 1252 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_188_output_0", "outputIndexes": [ 1260 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1260, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_36_output_0", "outputIndexes": [ 1261 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1261, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_391_output_0", "outputIndexes": [ 1262 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1247, 1262, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_49_output_0", "outputIndexes": [ 1263 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1263 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_24_output_0", "outputIndexes": [ 1264 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1261, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_390_output_0", "outputIndexes": [ 1265 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1247, 22, 1265, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_48_output_0", "outputIndexes": [ 1266 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1264, 1266 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_159_output_0", "outputIndexes": [ 1267 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1267, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_97_output_0", "outputIndexes": [ 1268 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1248, 1268 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_63_output_0", "outputIndexes": [ 1269 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3793 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 764033870, 1310742, 327680, 0, 0 ] } , "name": "/layers.12/self_attn/k_proj/Linear", "outputIndexes": [ 3798 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3798 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3799 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3799 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1270 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1234, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_386_output_0", "outputIndexes": [ 1271 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1242, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_387_output_0", "outputIndexes": [ 1272 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1271, 1272, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_157_output_0", "outputIndexes": [ 1273 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1270, 1273 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_110_output_0", "outputIndexes": [ 1274 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1274 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 765672292, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_12/Mul_1_output_0", "outputIndexes": [ 1276 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1276, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_98_output_0", "outputIndexes": [ 1277 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1276 ] , "main_type": "NONE", "name": "/Shape_171_output_0", "outputIndexes": [ 1278 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1278 ] , "main_type": "NONE", "name": "Shape4929", "outputIndexes": [ 1279 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1278 ] , "main_type": "NONE", "name": "Rank4931", "outputIndexes": [ 1280 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1280, 1280 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4933", "outputIndexes": [ 1281 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1281 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4934", "outputIndexes": [ 1282 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1281, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4936", "outputIndexes": [ 1283 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1283 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4937", "outputIndexes": [ 1284 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1279, 1282, 1284, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4940", "outputIndexes": [ 1285 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1285 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4941", "outputIndexes": [ 1286 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1286 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4942", "outputIndexes": [ 1287 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1287, 1286 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4943", "outputIndexes": [ 1288 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1278, 1288, 1281 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_189_output_0", "outputIndexes": [ 1289 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1289, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_37_output_0", "outputIndexes": [ 1290 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1290, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_393_output_0", "outputIndexes": [ 1291 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1276, 1291, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_51_output_0", "outputIndexes": [ 1292 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1292 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_25_output_0", "outputIndexes": [ 1293 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1290, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_392_output_0", "outputIndexes": [ 1294 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1276, 22, 1294, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_50_output_0", "outputIndexes": [ 1295 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1293, 1295 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_160_output_0", "outputIndexes": [ 1296 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1296, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_99_output_0", "outputIndexes": [ 1297 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1277, 1297 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_64_output_0", "outputIndexes": [ 1298 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3793 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 765673316, 1310742, 327680, 0, 0 ] } , "name": "/layers.12/self_attn/v_proj/Linear", "outputIndexes": [ 3802 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3802 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3803 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3803 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1299 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1234, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_388_output_0", "outputIndexes": [ 1300 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1242, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_389_output_0", "outputIndexes": [ 1301 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1300, 1301, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_158_output_0", "outputIndexes": [ 1302 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1299, 1302 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_111_output_0", "outputIndexes": [ 1303 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1269, 1298, 1303, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_116_output_0", "outputIndexes": [ 1304 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1304 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3804 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3804 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3805 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3805 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 767311738, 5242902, 1310720, 0, 0 ] } , "name": "/layers.12/self_attn/o_proj/Linear", "outputIndexes": [ 3806 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3806 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3807 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3807 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1305 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1221, 1305 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_66_output_0", "outputIndexes": [ 1306 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1306 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 773865360, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_12/Mul_1_output_0", "outputIndexes": [ 1307 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1307 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3808 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3808 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3809 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3809 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 773885840, 12451862, 3112960, 0, 0 ] } , "name": "/layers.12/mlp/gate_proj/Linear", "outputIndexes": [ 3810 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3810 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3811 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3811 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1308 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1308 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_12/Mul_output_0", "outputIndexes": [ 1309 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3809 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 789450662, 12451862, 3112960, 0, 0 ] } , "name": "/layers.12/mlp/up_proj/Linear", "outputIndexes": [ 3814 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3814 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3815 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3815 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1310 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1309, 1310 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_12/Mul_output_0", "outputIndexes": [ 1311 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1311 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3816 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3816 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3817 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3817 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 805015484, 12451862, 3112960, 0, 0 ] } , "name": "/layers.12/mlp/down_proj/Linear", "outputIndexes": [ 3818 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3818 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3819 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3819 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1312 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1306, 1312 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_67_output_0", "outputIndexes": [ 1313 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_117_output_0", "outputIndexes": [ 1314 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1314 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 820580306, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_13/Mul_1_output_0", "outputIndexes": [ 1315 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1315 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3820 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3820 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3821 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3821 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 820600786, 5242902, 1310720, 0, 0 ] } , "name": "/layers.13/self_attn/q_proj/Linear", "outputIndexes": [ 3822 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3822 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3823 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3823 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1316 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1315 ] , "main_type": "NONE", "name": "/Shape_182_output_0", "outputIndexes": [ 1317 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1317 ] , "main_type": "NONE", "name": "Shape5272", "outputIndexes": [ 1318 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1317 ] , "main_type": "NONE", "name": "Rank5274", "outputIndexes": [ 1319 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1319, 1319 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5276", "outputIndexes": [ 1320 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1320 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5277", "outputIndexes": [ 1321 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1320, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5279", "outputIndexes": [ 1322 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1322 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5280", "outputIndexes": [ 1323 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1318, 1321, 1323, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5283", "outputIndexes": [ 1324 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1324 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5284", "outputIndexes": [ 1325 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1325, 1325 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5286", "outputIndexes": [ 1326 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1317, 1326, 1320 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_201_output_0", "outputIndexes": [ 1327 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1327, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_416_output_0", "outputIndexes": [ 1328 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1320 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5294", "outputIndexes": [ 1329 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1322 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5297", "outputIndexes": [ 1330 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1318, 1329, 1330, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5300", "outputIndexes": [ 1331 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1331 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5301", "outputIndexes": [ 1332 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1332 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5302", "outputIndexes": [ 1333 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1333, 1332 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5303", "outputIndexes": [ 1334 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1317, 1334, 1320 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_202_output_0", "outputIndexes": [ 1335 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1335, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_417_output_0", "outputIndexes": [ 1336 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1328, 1336, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_169_output_0", "outputIndexes": [ 1337 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1316, 1337 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_118_output_0", "outputIndexes": [ 1338 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1338 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 827154408, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_13/Mul_1_output_0", "outputIndexes": [ 1340 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1340, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_104_output_0", "outputIndexes": [ 1341 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1340 ] , "main_type": "NONE", "name": "/Shape_184_output_0", "outputIndexes": [ 1342 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1342 ] , "main_type": "NONE", "name": "Shape5422", "outputIndexes": [ 1343 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1342 ] , "main_type": "NONE", "name": "Rank5424", "outputIndexes": [ 1344 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1344, 1344 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5426", "outputIndexes": [ 1345 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1345 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5427", "outputIndexes": [ 1346 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1345, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5429", "outputIndexes": [ 1347 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1347 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5430", "outputIndexes": [ 1348 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343, 1346, 1348, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5433", "outputIndexes": [ 1349 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1349 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5434", "outputIndexes": [ 1350 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1350 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5435", "outputIndexes": [ 1351 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1351, 1350 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5436", "outputIndexes": [ 1352 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1342, 1352, 1345 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_203_output_0", "outputIndexes": [ 1353 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1353, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_39_output_0", "outputIndexes": [ 1354 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1354, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_423_output_0", "outputIndexes": [ 1355 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1340, 1355, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_53_output_0", "outputIndexes": [ 1356 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1356 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_26_output_0", "outputIndexes": [ 1357 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1354, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_422_output_0", "outputIndexes": [ 1358 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1340, 22, 1358, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_52_output_0", "outputIndexes": [ 1359 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1357, 1359 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_172_output_0", "outputIndexes": [ 1360 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1360, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_105_output_0", "outputIndexes": [ 1361 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1341, 1361 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_68_output_0", "outputIndexes": [ 1362 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3821 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 827155432, 1310742, 327680, 0, 0 ] } , "name": "/layers.13/self_attn/k_proj/Linear", "outputIndexes": [ 3826 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3826 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3827 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3827 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1363 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1327, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_418_output_0", "outputIndexes": [ 1364 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1335, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_419_output_0", "outputIndexes": [ 1365 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1364, 1365, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_170_output_0", "outputIndexes": [ 1366 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1363, 1366 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_119_output_0", "outputIndexes": [ 1367 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1367 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 828793854, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_13/Mul_1_output_0", "outputIndexes": [ 1369 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1369, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_106_output_0", "outputIndexes": [ 1370 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1369 ] , "main_type": "NONE", "name": "/Shape_185_output_0", "outputIndexes": [ 1371 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1371 ] , "main_type": "NONE", "name": "Shape5318", "outputIndexes": [ 1372 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1371 ] , "main_type": "NONE", "name": "Rank5320", "outputIndexes": [ 1373 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1373, 1373 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5322", "outputIndexes": [ 1374 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1374 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5323", "outputIndexes": [ 1375 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1374, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5325", "outputIndexes": [ 1376 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1376 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5326", "outputIndexes": [ 1377 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1372, 1375, 1377, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5329", "outputIndexes": [ 1378 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1378 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5330", "outputIndexes": [ 1379 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1379 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5331", "outputIndexes": [ 1380 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1380, 1379 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5332", "outputIndexes": [ 1381 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1371, 1381, 1374 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_204_output_0", "outputIndexes": [ 1382 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1382, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_40_output_0", "outputIndexes": [ 1383 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1383, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_425_output_0", "outputIndexes": [ 1384 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1369, 1384, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_55_output_0", "outputIndexes": [ 1385 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1385 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_27_output_0", "outputIndexes": [ 1386 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1383, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_424_output_0", "outputIndexes": [ 1387 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1369, 22, 1387, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_54_output_0", "outputIndexes": [ 1388 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1386, 1388 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_173_output_0", "outputIndexes": [ 1389 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1389, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_107_output_0", "outputIndexes": [ 1390 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1370, 1390 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_69_output_0", "outputIndexes": [ 1391 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3821 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 828794878, 1310742, 327680, 0, 0 ] } , "name": "/layers.13/self_attn/v_proj/Linear", "outputIndexes": [ 3830 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3830 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3831 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3831 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1392 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1327, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_420_output_0", "outputIndexes": [ 1393 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1335, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_421_output_0", "outputIndexes": [ 1394 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1393, 1394, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_171_output_0", "outputIndexes": [ 1395 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1392, 1395 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_120_output_0", "outputIndexes": [ 1396 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1362, 1391, 1396, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_125_output_0", "outputIndexes": [ 1397 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1397 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3832 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3832 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3833 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3833 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 830433300, 5242902, 1310720, 0, 0 ] } , "name": "/layers.13/self_attn/o_proj/Linear", "outputIndexes": [ 3834 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3834 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3835 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3835 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1398 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1314, 1398 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_71_output_0", "outputIndexes": [ 1399 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1399 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 836986922, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_13/Mul_1_output_0", "outputIndexes": [ 1400 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1400 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3836 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3836 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3837 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3837 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 837007402, 12451862, 3112960, 0, 0 ] } , "name": "/layers.13/mlp/gate_proj/Linear", "outputIndexes": [ 3838 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3838 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3839 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3839 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1401 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1401 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_13/Mul_output_0", "outputIndexes": [ 1402 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3837 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 852572224, 12451862, 3112960, 0, 0 ] } , "name": "/layers.13/mlp/up_proj/Linear", "outputIndexes": [ 3842 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3842 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3843 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3843 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1403 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1402, 1403 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_13/Mul_output_0", "outputIndexes": [ 1404 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1404 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3844 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3844 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3845 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3845 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 868137046, 12451862, 3112960, 0, 0 ] } , "name": "/layers.13/mlp/down_proj/Linear", "outputIndexes": [ 3846 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3846 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3847 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3847 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1405 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1399, 1405 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_72_output_0", "outputIndexes": [ 1406 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1406, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_126_output_0", "outputIndexes": [ 1407 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 883701868, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_14/Mul_1_output_0", "outputIndexes": [ 1408 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1408 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3848 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3848 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3849 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3849 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 883722348, 5242902, 1310720, 0, 0 ] } , "name": "/layers.14/self_attn/q_proj/Linear", "outputIndexes": [ 3850 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3850 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3851 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3851 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1409 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1408 ] , "main_type": "NONE", "name": "/Shape_196_output_0", "outputIndexes": [ 1410 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1410 ] , "main_type": "NONE", "name": "Shape5661", "outputIndexes": [ 1411 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1410 ] , "main_type": "NONE", "name": "Rank5663", "outputIndexes": [ 1412 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1412, 1412 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5665", "outputIndexes": [ 1413 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1413 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5666", "outputIndexes": [ 1414 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1413, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5668", "outputIndexes": [ 1415 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1415 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5669", "outputIndexes": [ 1416 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1411, 1414, 1416, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5672", "outputIndexes": [ 1417 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1417 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5673", "outputIndexes": [ 1418 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1418, 1418 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5675", "outputIndexes": [ 1419 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1410, 1419, 1413 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_216_output_0", "outputIndexes": [ 1420 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1420, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_448_output_0", "outputIndexes": [ 1421 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1413 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5683", "outputIndexes": [ 1422 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1415 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5686", "outputIndexes": [ 1423 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1411, 1422, 1423, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5689", "outputIndexes": [ 1424 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1424 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5690", "outputIndexes": [ 1425 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1425 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5691", "outputIndexes": [ 1426 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1426, 1425 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5692", "outputIndexes": [ 1427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1410, 1427, 1413 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_217_output_0", "outputIndexes": [ 1428 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1428, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_449_output_0", "outputIndexes": [ 1429 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1421, 1429, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_182_output_0", "outputIndexes": [ 1430 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1409, 1430 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_127_output_0", "outputIndexes": [ 1431 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1431 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 890275970, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_14/Mul_1_output_0", "outputIndexes": [ 1433 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1433, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_112_output_0", "outputIndexes": [ 1434 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1433 ] , "main_type": "NONE", "name": "/Shape_198_output_0", "outputIndexes": [ 1435 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1435 ] , "main_type": "NONE", "name": "Shape5811", "outputIndexes": [ 1436 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1435 ] , "main_type": "NONE", "name": "Rank5813", "outputIndexes": [ 1437 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1437, 1437 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5815", "outputIndexes": [ 1438 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1438 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5816", "outputIndexes": [ 1439 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1438, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5818", "outputIndexes": [ 1440 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1440 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5819", "outputIndexes": [ 1441 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1436, 1439, 1441, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5822", "outputIndexes": [ 1442 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1442 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5823", "outputIndexes": [ 1443 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1443 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5824", "outputIndexes": [ 1444 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1444, 1443 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5825", "outputIndexes": [ 1445 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1435, 1445, 1438 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_218_output_0", "outputIndexes": [ 1446 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1446, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_42_output_0", "outputIndexes": [ 1447 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1447, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_455_output_0", "outputIndexes": [ 1448 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1433, 1448, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_57_output_0", "outputIndexes": [ 1449 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1449 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_28_output_0", "outputIndexes": [ 1450 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1447, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_454_output_0", "outputIndexes": [ 1451 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1433, 22, 1451, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_56_output_0", "outputIndexes": [ 1452 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1450, 1452 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_185_output_0", "outputIndexes": [ 1453 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1453, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_113_output_0", "outputIndexes": [ 1454 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1434, 1454 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_73_output_0", "outputIndexes": [ 1455 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3849 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 890276994, 1310742, 327680, 0, 0 ] } , "name": "/layers.14/self_attn/k_proj/Linear", "outputIndexes": [ 3854 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3854 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3855 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3855 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1456 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1420, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_450_output_0", "outputIndexes": [ 1457 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1428, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_451_output_0", "outputIndexes": [ 1458 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1457, 1458, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_183_output_0", "outputIndexes": [ 1459 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1456, 1459 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_128_output_0", "outputIndexes": [ 1460 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1460 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 891915416, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_14/Mul_1_output_0", "outputIndexes": [ 1462 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_114_output_0", "outputIndexes": [ 1463 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462 ] , "main_type": "NONE", "name": "/Shape_199_output_0", "outputIndexes": [ 1464 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1464 ] , "main_type": "NONE", "name": "Shape5707", "outputIndexes": [ 1465 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1464 ] , "main_type": "NONE", "name": "Rank5709", "outputIndexes": [ 1466 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1466, 1466 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5711", "outputIndexes": [ 1467 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1467 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5712", "outputIndexes": [ 1468 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1467, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5714", "outputIndexes": [ 1469 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1469 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5715", "outputIndexes": [ 1470 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1465, 1468, 1470, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5718", "outputIndexes": [ 1471 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1471 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5719", "outputIndexes": [ 1472 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1472 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5720", "outputIndexes": [ 1473 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1473, 1472 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5721", "outputIndexes": [ 1474 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1464, 1474, 1467 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_219_output_0", "outputIndexes": [ 1475 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1475, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_43_output_0", "outputIndexes": [ 1476 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_457_output_0", "outputIndexes": [ 1477 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462, 1477, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_59_output_0", "outputIndexes": [ 1478 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1478 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_29_output_0", "outputIndexes": [ 1479 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_456_output_0", "outputIndexes": [ 1480 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462, 22, 1480, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_58_output_0", "outputIndexes": [ 1481 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1479, 1481 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_186_output_0", "outputIndexes": [ 1482 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1482, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_115_output_0", "outputIndexes": [ 1483 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1463, 1483 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_74_output_0", "outputIndexes": [ 1484 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3849 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 891916440, 1310742, 327680, 0, 0 ] } , "name": "/layers.14/self_attn/v_proj/Linear", "outputIndexes": [ 3858 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3858 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3859 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3859 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1485 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1420, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_452_output_0", "outputIndexes": [ 1486 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1428, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_453_output_0", "outputIndexes": [ 1487 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1486, 1487, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_184_output_0", "outputIndexes": [ 1488 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1485, 1488 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_129_output_0", "outputIndexes": [ 1489 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1455, 1484, 1489, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_134_output_0", "outputIndexes": [ 1490 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1490 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3860 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3860 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3861 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3861 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 893554862, 5242902, 1310720, 0, 0 ] } , "name": "/layers.14/self_attn/o_proj/Linear", "outputIndexes": [ 3862 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3862 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3863 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3863 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1491 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407, 1491 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_76_output_0", "outputIndexes": [ 1492 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1492 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 900108484, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_14/Mul_1_output_0", "outputIndexes": [ 1493 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1493 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3864 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3864 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3865 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3865 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 900128964, 12451862, 3112960, 0, 0 ] } , "name": "/layers.14/mlp/gate_proj/Linear", "outputIndexes": [ 3866 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3866 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3867 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3867 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1494 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_14/Mul_output_0", "outputIndexes": [ 1495 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3865 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 915693786, 12451862, 3112960, 0, 0 ] } , "name": "/layers.14/mlp/up_proj/Linear", "outputIndexes": [ 3870 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3870 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3871 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3871 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1496 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1495, 1496 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_14/Mul_output_0", "outputIndexes": [ 1497 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1497 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3872 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3872 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3873 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3873 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 931258608, 12451862, 3112960, 0, 0 ] } , "name": "/layers.14/mlp/down_proj/Linear", "outputIndexes": [ 3874 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3874 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3875 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3875 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1498 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1492, 1498 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_77_output_0", "outputIndexes": [ 1499 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1499, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_135_output_0", "outputIndexes": [ 1500 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1500 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 946823430, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_15/Mul_1_output_0", "outputIndexes": [ 1501 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1501 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3876 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3876 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3877 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3877 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 946843910, 5242902, 1310720, 0, 0 ] } , "name": "/layers.15/self_attn/q_proj/Linear", "outputIndexes": [ 3878 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3878 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3879 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3879 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1502 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1501 ] , "main_type": "NONE", "name": "/Shape_210_output_0", "outputIndexes": [ 1503 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1503 ] , "main_type": "NONE", "name": "Shape6050", "outputIndexes": [ 1504 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1503 ] , "main_type": "NONE", "name": "Rank6052", "outputIndexes": [ 1505 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1505, 1505 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6054", "outputIndexes": [ 1506 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1506 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6055", "outputIndexes": [ 1507 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1506, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6057", "outputIndexes": [ 1508 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1508 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6058", "outputIndexes": [ 1509 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1504, 1507, 1509, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6061", "outputIndexes": [ 1510 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1510 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6062", "outputIndexes": [ 1511 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1511, 1511 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6064", "outputIndexes": [ 1512 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1503, 1512, 1506 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_231_output_0", "outputIndexes": [ 1513 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1513, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_480_output_0", "outputIndexes": [ 1514 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1506 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6072", "outputIndexes": [ 1515 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1508 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6075", "outputIndexes": [ 1516 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1504, 1515, 1516, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6078", "outputIndexes": [ 1517 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1517 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6079", "outputIndexes": [ 1518 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1518 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6080", "outputIndexes": [ 1519 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1519, 1518 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6081", "outputIndexes": [ 1520 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1503, 1520, 1506 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_232_output_0", "outputIndexes": [ 1521 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_481_output_0", "outputIndexes": [ 1522 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1514, 1522, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_195_output_0", "outputIndexes": [ 1523 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1502, 1523 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_136_output_0", "outputIndexes": [ 1524 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1524 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 953397532, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_15/Mul_1_output_0", "outputIndexes": [ 1526 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_120_output_0", "outputIndexes": [ 1527 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526 ] , "main_type": "NONE", "name": "/Shape_212_output_0", "outputIndexes": [ 1528 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1528 ] , "main_type": "NONE", "name": "Shape6200", "outputIndexes": [ 1529 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1528 ] , "main_type": "NONE", "name": "Rank6202", "outputIndexes": [ 1530 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1530, 1530 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6204", "outputIndexes": [ 1531 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1531 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6205", "outputIndexes": [ 1532 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1531, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6207", "outputIndexes": [ 1533 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1533 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6208", "outputIndexes": [ 1534 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1529, 1532, 1534, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6211", "outputIndexes": [ 1535 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1535 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6212", "outputIndexes": [ 1536 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1536 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6213", "outputIndexes": [ 1537 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1537, 1536 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6214", "outputIndexes": [ 1538 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1528, 1538, 1531 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_233_output_0", "outputIndexes": [ 1539 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1539, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_45_output_0", "outputIndexes": [ 1540 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1540, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_487_output_0", "outputIndexes": [ 1541 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526, 1541, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_61_output_0", "outputIndexes": [ 1542 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1542 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_30_output_0", "outputIndexes": [ 1543 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1540, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_486_output_0", "outputIndexes": [ 1544 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526, 22, 1544, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_60_output_0", "outputIndexes": [ 1545 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1543, 1545 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_198_output_0", "outputIndexes": [ 1546 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1546, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_121_output_0", "outputIndexes": [ 1547 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1527, 1547 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_78_output_0", "outputIndexes": [ 1548 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3877 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 953398556, 1310742, 327680, 0, 0 ] } , "name": "/layers.15/self_attn/k_proj/Linear", "outputIndexes": [ 3882 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3882 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3883 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3883 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1549 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1513, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_482_output_0", "outputIndexes": [ 1550 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_483_output_0", "outputIndexes": [ 1551 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1550, 1551, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_196_output_0", "outputIndexes": [ 1552 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1549, 1552 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_137_output_0", "outputIndexes": [ 1553 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1553 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 955036978, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_15/Mul_1_output_0", "outputIndexes": [ 1555 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1555, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_122_output_0", "outputIndexes": [ 1556 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1555 ] , "main_type": "NONE", "name": "/Shape_213_output_0", "outputIndexes": [ 1557 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1557 ] , "main_type": "NONE", "name": "Shape6096", "outputIndexes": [ 1558 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1557 ] , "main_type": "NONE", "name": "Rank6098", "outputIndexes": [ 1559 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1559, 1559 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6100", "outputIndexes": [ 1560 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6101", "outputIndexes": [ 1561 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6103", "outputIndexes": [ 1562 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1562 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6104", "outputIndexes": [ 1563 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1558, 1561, 1563, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6107", "outputIndexes": [ 1564 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1564 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6108", "outputIndexes": [ 1565 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1565 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6109", "outputIndexes": [ 1566 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1566, 1565 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6110", "outputIndexes": [ 1567 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1557, 1567, 1560 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_234_output_0", "outputIndexes": [ 1568 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1568, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_46_output_0", "outputIndexes": [ 1569 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1569, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_489_output_0", "outputIndexes": [ 1570 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1555, 1570, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_63_output_0", "outputIndexes": [ 1571 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1571 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_31_output_0", "outputIndexes": [ 1572 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1569, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_488_output_0", "outputIndexes": [ 1573 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1555, 22, 1573, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_62_output_0", "outputIndexes": [ 1574 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1572, 1574 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_199_output_0", "outputIndexes": [ 1575 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1575, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_123_output_0", "outputIndexes": [ 1576 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1556, 1576 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_79_output_0", "outputIndexes": [ 1577 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3877 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 955038002, 1310742, 327680, 0, 0 ] } , "name": "/layers.15/self_attn/v_proj/Linear", "outputIndexes": [ 3886 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3886 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3887 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3887 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1578 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1513, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_484_output_0", "outputIndexes": [ 1579 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_485_output_0", "outputIndexes": [ 1580 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1579, 1580, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_197_output_0", "outputIndexes": [ 1581 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1578, 1581 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_138_output_0", "outputIndexes": [ 1582 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1548, 1577, 1582, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_143_output_0", "outputIndexes": [ 1583 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3888 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3888 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3889 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3889 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 956676424, 5242902, 1310720, 0, 0 ] } , "name": "/layers.15/self_attn/o_proj/Linear", "outputIndexes": [ 3890 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3890 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3891 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3891 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1584 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1500, 1584 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_81_output_0", "outputIndexes": [ 1585 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1585 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 963230046, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_15/Mul_1_output_0", "outputIndexes": [ 1586 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1586 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3892 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3892 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3893 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3893 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 963250526, 12451862, 3112960, 0, 0 ] } , "name": "/layers.15/mlp/gate_proj/Linear", "outputIndexes": [ 3894 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3894 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3895 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3895 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1587 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1587 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_15/Mul_output_0", "outputIndexes": [ 1588 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3893 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 978815348, 12451862, 3112960, 0, 0 ] } , "name": "/layers.15/mlp/up_proj/Linear", "outputIndexes": [ 3898 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3898 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3899 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3899 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1589 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1588, 1589 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_15/Mul_output_0", "outputIndexes": [ 1590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1590 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3900 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3900 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3901 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3901 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 994380170, 12451862, 3112960, 0, 0 ] } , "name": "/layers.15/mlp/down_proj/Linear", "outputIndexes": [ 3902 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3902 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3903 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3903 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1591 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1585, 1591 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_82_output_0", "outputIndexes": [ 1592 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1592, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_144_output_0", "outputIndexes": [ 1593 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1593 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1009944992, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_16/Mul_1_output_0", "outputIndexes": [ 1594 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1594 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3904 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3904 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3905 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3905 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1009965472, 5242902, 1310720, 0, 0 ] } , "name": "/layers.16/self_attn/q_proj/Linear", "outputIndexes": [ 3906 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3906 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3907 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3907 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1595 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1594 ] , "main_type": "NONE", "name": "/Shape_224_output_0", "outputIndexes": [ 1596 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1596 ] , "main_type": "NONE", "name": "Shape6439", "outputIndexes": [ 1597 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1596 ] , "main_type": "NONE", "name": "Rank6441", "outputIndexes": [ 1598 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1598, 1598 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6443", "outputIndexes": [ 1599 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1599 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6444", "outputIndexes": [ 1600 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1599, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6446", "outputIndexes": [ 1601 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1601 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6447", "outputIndexes": [ 1602 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1597, 1600, 1602, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6450", "outputIndexes": [ 1603 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1603 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6451", "outputIndexes": [ 1604 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1604, 1604 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6453", "outputIndexes": [ 1605 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1596, 1605, 1599 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_246_output_0", "outputIndexes": [ 1606 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1606, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_512_output_0", "outputIndexes": [ 1607 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1599 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6461", "outputIndexes": [ 1608 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1601 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6464", "outputIndexes": [ 1609 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1597, 1608, 1609, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6467", "outputIndexes": [ 1610 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1610 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6468", "outputIndexes": [ 1611 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1611 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6469", "outputIndexes": [ 1612 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1612, 1611 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6470", "outputIndexes": [ 1613 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1596, 1613, 1599 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_247_output_0", "outputIndexes": [ 1614 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1614, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_513_output_0", "outputIndexes": [ 1615 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1607, 1615, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_208_output_0", "outputIndexes": [ 1616 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1595, 1616 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_145_output_0", "outputIndexes": [ 1617 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1617 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1016519094, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_16/Mul_1_output_0", "outputIndexes": [ 1619 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_128_output_0", "outputIndexes": [ 1620 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619 ] , "main_type": "NONE", "name": "/Shape_226_output_0", "outputIndexes": [ 1621 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1621 ] , "main_type": "NONE", "name": "Shape6589", "outputIndexes": [ 1622 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1621 ] , "main_type": "NONE", "name": "Rank6591", "outputIndexes": [ 1623 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1623, 1623 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6593", "outputIndexes": [ 1624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1624 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6594", "outputIndexes": [ 1625 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1624, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6596", "outputIndexes": [ 1626 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1626 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6597", "outputIndexes": [ 1627 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1622, 1625, 1627, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6600", "outputIndexes": [ 1628 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1628 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6601", "outputIndexes": [ 1629 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1629 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6602", "outputIndexes": [ 1630 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1630, 1629 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6603", "outputIndexes": [ 1631 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1621, 1631, 1624 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_248_output_0", "outputIndexes": [ 1632 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1632, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_48_output_0", "outputIndexes": [ 1633 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1633, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_519_output_0", "outputIndexes": [ 1634 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619, 1634, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_65_output_0", "outputIndexes": [ 1635 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1635 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_32_output_0", "outputIndexes": [ 1636 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1633, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_518_output_0", "outputIndexes": [ 1637 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619, 22, 1637, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_64_output_0", "outputIndexes": [ 1638 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1636, 1638 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_211_output_0", "outputIndexes": [ 1639 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1639, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_129_output_0", "outputIndexes": [ 1640 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1620, 1640 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_83_output_0", "outputIndexes": [ 1641 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3905 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1016520118, 1310742, 327680, 0, 0 ] } , "name": "/layers.16/self_attn/k_proj/Linear", "outputIndexes": [ 3910 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3910 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3911 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3911 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1642 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1606, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_514_output_0", "outputIndexes": [ 1643 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1614, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_515_output_0", "outputIndexes": [ 1644 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1643, 1644, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_209_output_0", "outputIndexes": [ 1645 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1642, 1645 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_146_output_0", "outputIndexes": [ 1646 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1646 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1018158540, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_16/Mul_1_output_0", "outputIndexes": [ 1648 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_130_output_0", "outputIndexes": [ 1649 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648 ] , "main_type": "NONE", "name": "/Shape_227_output_0", "outputIndexes": [ 1650 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1650 ] , "main_type": "NONE", "name": "Shape6485", "outputIndexes": [ 1651 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1650 ] , "main_type": "NONE", "name": "Rank6487", "outputIndexes": [ 1652 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1652, 1652 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6489", "outputIndexes": [ 1653 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6490", "outputIndexes": [ 1654 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6492", "outputIndexes": [ 1655 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1655 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6493", "outputIndexes": [ 1656 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1651, 1654, 1656, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6496", "outputIndexes": [ 1657 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1657 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6497", "outputIndexes": [ 1658 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1658 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6498", "outputIndexes": [ 1659 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1659, 1658 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6499", "outputIndexes": [ 1660 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1650, 1660, 1653 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_249_output_0", "outputIndexes": [ 1661 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1661, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_49_output_0", "outputIndexes": [ 1662 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1662, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_521_output_0", "outputIndexes": [ 1663 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 1663, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_67_output_0", "outputIndexes": [ 1664 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1664 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_33_output_0", "outputIndexes": [ 1665 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1662, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_520_output_0", "outputIndexes": [ 1666 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 22, 1666, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_66_output_0", "outputIndexes": [ 1667 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1665, 1667 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_212_output_0", "outputIndexes": [ 1668 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1668, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_131_output_0", "outputIndexes": [ 1669 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1649, 1669 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_84_output_0", "outputIndexes": [ 1670 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3905 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1018159564, 1310742, 327680, 0, 0 ] } , "name": "/layers.16/self_attn/v_proj/Linear", "outputIndexes": [ 3914 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3914 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3915 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3915 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1671 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1606, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_516_output_0", "outputIndexes": [ 1672 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1614, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_517_output_0", "outputIndexes": [ 1673 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1672, 1673, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_210_output_0", "outputIndexes": [ 1674 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1671, 1674 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_147_output_0", "outputIndexes": [ 1675 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1641, 1670, 1675, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_152_output_0", "outputIndexes": [ 1676 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1676 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3916 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3916 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3917 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3917 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1019797986, 5242902, 1310720, 0, 0 ] } , "name": "/layers.16/self_attn/o_proj/Linear", "outputIndexes": [ 3918 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3918 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3919 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3919 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1677 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1593, 1677 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_86_output_0", "outputIndexes": [ 1678 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1678 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1026351608, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_16/Mul_1_output_0", "outputIndexes": [ 1679 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1679 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3920 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3920 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3921 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3921 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1026372088, 12451862, 3112960, 0, 0 ] } , "name": "/layers.16/mlp/gate_proj/Linear", "outputIndexes": [ 3922 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3922 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3923 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3923 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1680 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1680 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_16/Mul_output_0", "outputIndexes": [ 1681 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3921 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1041936910, 12451862, 3112960, 0, 0 ] } , "name": "/layers.16/mlp/up_proj/Linear", "outputIndexes": [ 3926 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3926 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3927 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3927 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1682 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1681, 1682 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_16/Mul_output_0", "outputIndexes": [ 1683 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1683 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3928 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3928 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3929 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3929 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1057501732, 12451862, 3112960, 0, 0 ] } , "name": "/layers.16/mlp/down_proj/Linear", "outputIndexes": [ 3930 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3930 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3931 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3931 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1684 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1678, 1684 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_87_output_0", "outputIndexes": [ 1685 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1685, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_153_output_0", "outputIndexes": [ 1686 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1686 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1073066554, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_17/Mul_1_output_0", "outputIndexes": [ 1687 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1687 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3932 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3932 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3933 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3933 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1073087034, 5242902, 1310720, 0, 0 ] } , "name": "/layers.17/self_attn/q_proj/Linear", "outputIndexes": [ 3934 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3934 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3935 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3935 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1688 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1687 ] , "main_type": "NONE", "name": "/Shape_238_output_0", "outputIndexes": [ 1689 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1689 ] , "main_type": "NONE", "name": "Shape6828", "outputIndexes": [ 1690 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1689 ] , "main_type": "NONE", "name": "Rank6830", "outputIndexes": [ 1691 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1691, 1691 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6832", "outputIndexes": [ 1692 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1692 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6833", "outputIndexes": [ 1693 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1692, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6835", "outputIndexes": [ 1694 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1694 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6836", "outputIndexes": [ 1695 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1690, 1693, 1695, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6839", "outputIndexes": [ 1696 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1696 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6840", "outputIndexes": [ 1697 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1697, 1697 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6842", "outputIndexes": [ 1698 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1689, 1698, 1692 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_261_output_0", "outputIndexes": [ 1699 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_544_output_0", "outputIndexes": [ 1700 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1692 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6850", "outputIndexes": [ 1701 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1694 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6853", "outputIndexes": [ 1702 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1690, 1701, 1702, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6856", "outputIndexes": [ 1703 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1703 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6857", "outputIndexes": [ 1704 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1704 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6858", "outputIndexes": [ 1705 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1705, 1704 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6859", "outputIndexes": [ 1706 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1689, 1706, 1692 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_262_output_0", "outputIndexes": [ 1707 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1707, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_545_output_0", "outputIndexes": [ 1708 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1700, 1708, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_221_output_0", "outputIndexes": [ 1709 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1688, 1709 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_154_output_0", "outputIndexes": [ 1710 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1710 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1079640656, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_17/Mul_1_output_0", "outputIndexes": [ 1712 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1712, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_136_output_0", "outputIndexes": [ 1713 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1712 ] , "main_type": "NONE", "name": "/Shape_240_output_0", "outputIndexes": [ 1714 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1714 ] , "main_type": "NONE", "name": "Shape6978", "outputIndexes": [ 1715 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1714 ] , "main_type": "NONE", "name": "Rank6980", "outputIndexes": [ 1716 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1716, 1716 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6982", "outputIndexes": [ 1717 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1717 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6983", "outputIndexes": [ 1718 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1717, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6985", "outputIndexes": [ 1719 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1719 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6986", "outputIndexes": [ 1720 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1715, 1718, 1720, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6989", "outputIndexes": [ 1721 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1721 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6990", "outputIndexes": [ 1722 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1722 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6991", "outputIndexes": [ 1723 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1723, 1722 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6992", "outputIndexes": [ 1724 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1714, 1724, 1717 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_263_output_0", "outputIndexes": [ 1725 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1725, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_51_output_0", "outputIndexes": [ 1726 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1726, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_551_output_0", "outputIndexes": [ 1727 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1712, 1727, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_69_output_0", "outputIndexes": [ 1728 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1728 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_34_output_0", "outputIndexes": [ 1729 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1726, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_550_output_0", "outputIndexes": [ 1730 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1712, 22, 1730, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_68_output_0", "outputIndexes": [ 1731 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1729, 1731 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_224_output_0", "outputIndexes": [ 1732 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1732, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_137_output_0", "outputIndexes": [ 1733 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1713, 1733 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_88_output_0", "outputIndexes": [ 1734 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3933 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1079641680, 1310742, 327680, 0, 0 ] } , "name": "/layers.17/self_attn/k_proj/Linear", "outputIndexes": [ 3938 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3938 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3939 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3939 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1735 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_546_output_0", "outputIndexes": [ 1736 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1707, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_547_output_0", "outputIndexes": [ 1737 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1736, 1737, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_222_output_0", "outputIndexes": [ 1738 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1735, 1738 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_155_output_0", "outputIndexes": [ 1739 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1739 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1081280102, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_17/Mul_1_output_0", "outputIndexes": [ 1741 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_138_output_0", "outputIndexes": [ 1742 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741 ] , "main_type": "NONE", "name": "/Shape_241_output_0", "outputIndexes": [ 1743 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1743 ] , "main_type": "NONE", "name": "Shape6874", "outputIndexes": [ 1744 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1743 ] , "main_type": "NONE", "name": "Rank6876", "outputIndexes": [ 1745 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1745, 1745 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6878", "outputIndexes": [ 1746 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1746 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6879", "outputIndexes": [ 1747 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1746, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6881", "outputIndexes": [ 1748 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1748 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6882", "outputIndexes": [ 1749 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1744, 1747, 1749, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6885", "outputIndexes": [ 1750 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1750 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6886", "outputIndexes": [ 1751 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1751 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6887", "outputIndexes": [ 1752 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1752, 1751 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6888", "outputIndexes": [ 1753 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1743, 1753, 1746 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_264_output_0", "outputIndexes": [ 1754 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1754, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_52_output_0", "outputIndexes": [ 1755 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1755, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_553_output_0", "outputIndexes": [ 1756 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 1756, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_71_output_0", "outputIndexes": [ 1757 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1757 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_35_output_0", "outputIndexes": [ 1758 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1755, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_552_output_0", "outputIndexes": [ 1759 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 22, 1759, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_70_output_0", "outputIndexes": [ 1760 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1758, 1760 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_225_output_0", "outputIndexes": [ 1761 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1761, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_139_output_0", "outputIndexes": [ 1762 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1742, 1762 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_89_output_0", "outputIndexes": [ 1763 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3933 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1081281126, 1310742, 327680, 0, 0 ] } , "name": "/layers.17/self_attn/v_proj/Linear", "outputIndexes": [ 3942 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3942 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3943 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3943 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1764 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_548_output_0", "outputIndexes": [ 1765 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1707, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_549_output_0", "outputIndexes": [ 1766 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1765, 1766, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_223_output_0", "outputIndexes": [ 1767 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1764, 1767 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_156_output_0", "outputIndexes": [ 1768 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1734, 1763, 1768, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_161_output_0", "outputIndexes": [ 1769 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1769 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3944 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3944 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3945 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3945 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1082919548, 5242902, 1310720, 0, 0 ] } , "name": "/layers.17/self_attn/o_proj/Linear", "outputIndexes": [ 3946 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3946 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3947 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3947 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1770 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1686, 1770 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_91_output_0", "outputIndexes": [ 1771 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1771 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1089473170, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_17/Mul_1_output_0", "outputIndexes": [ 1772 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1772 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3948 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3948 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3949 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3949 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1089493650, 12451862, 3112960, 0, 0 ] } , "name": "/layers.17/mlp/gate_proj/Linear", "outputIndexes": [ 3950 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3950 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3951 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3951 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1773 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1773 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_17/Mul_output_0", "outputIndexes": [ 1774 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3949 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1105058472, 12451862, 3112960, 0, 0 ] } , "name": "/layers.17/mlp/up_proj/Linear", "outputIndexes": [ 3954 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3954 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3955 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3955 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1775 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1774, 1775 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_17/Mul_output_0", "outputIndexes": [ 1776 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1776 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3956 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3956 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3957 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3957 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1120623294, 12451862, 3112960, 0, 0 ] } , "name": "/layers.17/mlp/down_proj/Linear", "outputIndexes": [ 3958 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3958 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3959 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3959 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1777 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1771, 1777 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_92_output_0", "outputIndexes": [ 1778 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1778, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_162_output_0", "outputIndexes": [ 1779 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1779 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1136188116, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_18/Mul_1_output_0", "outputIndexes": [ 1780 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1780 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3960 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3960 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3961 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3961 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1136208596, 5242902, 1310720, 0, 0 ] } , "name": "/layers.18/self_attn/q_proj/Linear", "outputIndexes": [ 3962 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3962 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3963 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3963 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1781 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1780 ] , "main_type": "NONE", "name": "/Shape_252_output_0", "outputIndexes": [ 1782 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1782 ] , "main_type": "NONE", "name": "Shape7217", "outputIndexes": [ 1783 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1782 ] , "main_type": "NONE", "name": "Rank7219", "outputIndexes": [ 1784 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1784, 1784 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7221", "outputIndexes": [ 1785 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1785 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7222", "outputIndexes": [ 1786 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1785, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7224", "outputIndexes": [ 1787 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1787 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7225", "outputIndexes": [ 1788 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1783, 1786, 1788, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7228", "outputIndexes": [ 1789 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1789 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7229", "outputIndexes": [ 1790 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1790, 1790 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7231", "outputIndexes": [ 1791 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1782, 1791, 1785 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_276_output_0", "outputIndexes": [ 1792 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1792, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_576_output_0", "outputIndexes": [ 1793 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1785 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7239", "outputIndexes": [ 1794 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1787 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7242", "outputIndexes": [ 1795 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1783, 1794, 1795, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7245", "outputIndexes": [ 1796 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1796 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7246", "outputIndexes": [ 1797 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1797 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7247", "outputIndexes": [ 1798 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1798, 1797 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7248", "outputIndexes": [ 1799 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1782, 1799, 1785 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_277_output_0", "outputIndexes": [ 1800 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1800, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_577_output_0", "outputIndexes": [ 1801 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1793, 1801, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_234_output_0", "outputIndexes": [ 1802 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1781, 1802 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_163_output_0", "outputIndexes": [ 1803 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1803 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1142762218, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_18/Mul_1_output_0", "outputIndexes": [ 1805 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1805, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_144_output_0", "outputIndexes": [ 1806 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1805 ] , "main_type": "NONE", "name": "/Shape_254_output_0", "outputIndexes": [ 1807 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1807 ] , "main_type": "NONE", "name": "Shape7367", "outputIndexes": [ 1808 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1807 ] , "main_type": "NONE", "name": "Rank7369", "outputIndexes": [ 1809 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1809, 1809 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7371", "outputIndexes": [ 1810 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1810 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7372", "outputIndexes": [ 1811 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1810, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7374", "outputIndexes": [ 1812 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1812 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7375", "outputIndexes": [ 1813 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1808, 1811, 1813, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7378", "outputIndexes": [ 1814 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1814 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7379", "outputIndexes": [ 1815 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1815 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7380", "outputIndexes": [ 1816 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1816, 1815 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7381", "outputIndexes": [ 1817 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1807, 1817, 1810 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_278_output_0", "outputIndexes": [ 1818 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1818, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_54_output_0", "outputIndexes": [ 1819 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1819, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_583_output_0", "outputIndexes": [ 1820 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1805, 1820, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_73_output_0", "outputIndexes": [ 1821 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1821 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_36_output_0", "outputIndexes": [ 1822 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1819, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_582_output_0", "outputIndexes": [ 1823 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1805, 22, 1823, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_72_output_0", "outputIndexes": [ 1824 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1822, 1824 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_237_output_0", "outputIndexes": [ 1825 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1825, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_145_output_0", "outputIndexes": [ 1826 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1806, 1826 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_93_output_0", "outputIndexes": [ 1827 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3961 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1142763242, 1310742, 327680, 0, 0 ] } , "name": "/layers.18/self_attn/k_proj/Linear", "outputIndexes": [ 3966 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3966 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3967 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3967 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1828 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1792, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_578_output_0", "outputIndexes": [ 1829 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1800, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_579_output_0", "outputIndexes": [ 1830 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1829, 1830, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_235_output_0", "outputIndexes": [ 1831 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1828, 1831 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_164_output_0", "outputIndexes": [ 1832 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1144401664, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_18/Mul_1_output_0", "outputIndexes": [ 1834 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_146_output_0", "outputIndexes": [ 1835 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834 ] , "main_type": "NONE", "name": "/Shape_255_output_0", "outputIndexes": [ 1836 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1836 ] , "main_type": "NONE", "name": "Shape7263", "outputIndexes": [ 1837 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1836 ] , "main_type": "NONE", "name": "Rank7265", "outputIndexes": [ 1838 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1838, 1838 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7267", "outputIndexes": [ 1839 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7268", "outputIndexes": [ 1840 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7270", "outputIndexes": [ 1841 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1841 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7271", "outputIndexes": [ 1842 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1837, 1840, 1842, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7274", "outputIndexes": [ 1843 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1843 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7275", "outputIndexes": [ 1844 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1844 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7276", "outputIndexes": [ 1845 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1845, 1844 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7277", "outputIndexes": [ 1846 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1836, 1846, 1839 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_279_output_0", "outputIndexes": [ 1847 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1847, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_55_output_0", "outputIndexes": [ 1848 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1848, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_585_output_0", "outputIndexes": [ 1849 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834, 1849, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_75_output_0", "outputIndexes": [ 1850 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_37_output_0", "outputIndexes": [ 1851 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1848, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_584_output_0", "outputIndexes": [ 1852 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834, 22, 1852, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_74_output_0", "outputIndexes": [ 1853 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1851, 1853 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_238_output_0", "outputIndexes": [ 1854 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1854, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_147_output_0", "outputIndexes": [ 1855 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1835, 1855 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_94_output_0", "outputIndexes": [ 1856 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3961 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1144402688, 1310742, 327680, 0, 0 ] } , "name": "/layers.18/self_attn/v_proj/Linear", "outputIndexes": [ 3970 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3970 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3971 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3971 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1857 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1792, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_580_output_0", "outputIndexes": [ 1858 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1800, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_581_output_0", "outputIndexes": [ 1859 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1858, 1859, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_236_output_0", "outputIndexes": [ 1860 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1857, 1860 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_165_output_0", "outputIndexes": [ 1861 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1827, 1856, 1861, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_170_output_0", "outputIndexes": [ 1862 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1862 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 3972 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3972 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 3973 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3973 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1146041110, 5242902, 1310720, 0, 0 ] } , "name": "/layers.18/self_attn/o_proj/Linear", "outputIndexes": [ 3974 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3974 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 3975 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3975 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1863 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1779, 1863 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_96_output_0", "outputIndexes": [ 1864 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1864 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1152594732, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_18/Mul_1_output_0", "outputIndexes": [ 1865 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1865 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 3976 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3976 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 3977 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3977 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1152615212, 12451862, 3112960, 0, 0 ] } , "name": "/layers.18/mlp/gate_proj/Linear", "outputIndexes": [ 3978 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3978 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 3979 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3979 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1866 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1866 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_18/Mul_output_0", "outputIndexes": [ 1867 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3977 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1168180034, 12451862, 3112960, 0, 0 ] } , "name": "/layers.18/mlp/up_proj/Linear", "outputIndexes": [ 3982 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3982 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 3983 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3983 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1868 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1867, 1868 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_18/Mul_output_0", "outputIndexes": [ 1869 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1869 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 3984 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3984 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 3985 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3985 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1183744856, 12451862, 3112960, 0, 0 ] } , "name": "/layers.18/mlp/down_proj/Linear", "outputIndexes": [ 3986 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3986 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 3987 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3987 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1870 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1864, 1870 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_97_output_0", "outputIndexes": [ 1871 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1871, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_171_output_0", "outputIndexes": [ 1872 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1872 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1199309678, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_19/Mul_1_output_0", "outputIndexes": [ 1873 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1873 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 3988 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3988 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 3989 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3989 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1199330158, 5242902, 1310720, 0, 0 ] } , "name": "/layers.19/self_attn/q_proj/Linear", "outputIndexes": [ 3990 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3990 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 3991 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3991 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1874 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1873 ] , "main_type": "NONE", "name": "/Shape_266_output_0", "outputIndexes": [ 1875 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1875 ] , "main_type": "NONE", "name": "Shape7606", "outputIndexes": [ 1876 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1875 ] , "main_type": "NONE", "name": "Rank7608", "outputIndexes": [ 1877 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1877, 1877 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7610", "outputIndexes": [ 1878 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1878 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7611", "outputIndexes": [ 1879 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1878, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7613", "outputIndexes": [ 1880 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1880 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7614", "outputIndexes": [ 1881 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1876, 1879, 1881, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7617", "outputIndexes": [ 1882 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1882 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7618", "outputIndexes": [ 1883 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1883, 1883 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7620", "outputIndexes": [ 1884 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1875, 1884, 1878 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_291_output_0", "outputIndexes": [ 1885 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1885, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_608_output_0", "outputIndexes": [ 1886 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1878 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7628", "outputIndexes": [ 1887 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1880 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7631", "outputIndexes": [ 1888 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1876, 1887, 1888, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7634", "outputIndexes": [ 1889 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1889 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7635", "outputIndexes": [ 1890 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1890 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7636", "outputIndexes": [ 1891 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1891, 1890 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7637", "outputIndexes": [ 1892 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1875, 1892, 1878 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_292_output_0", "outputIndexes": [ 1893 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1893, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_609_output_0", "outputIndexes": [ 1894 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1886, 1894, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_247_output_0", "outputIndexes": [ 1895 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1874, 1895 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_172_output_0", "outputIndexes": [ 1896 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1896 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1205883780, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_19/Mul_1_output_0", "outputIndexes": [ 1898 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1898, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_152_output_0", "outputIndexes": [ 1899 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1898 ] , "main_type": "NONE", "name": "/Shape_268_output_0", "outputIndexes": [ 1900 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1900 ] , "main_type": "NONE", "name": "Shape7756", "outputIndexes": [ 1901 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1900 ] , "main_type": "NONE", "name": "Rank7758", "outputIndexes": [ 1902 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1902, 1902 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7760", "outputIndexes": [ 1903 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1903 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7761", "outputIndexes": [ 1904 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1903, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7763", "outputIndexes": [ 1905 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1905 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7764", "outputIndexes": [ 1906 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1901, 1904, 1906, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7767", "outputIndexes": [ 1907 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7768", "outputIndexes": [ 1908 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1908 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7769", "outputIndexes": [ 1909 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1909, 1908 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7770", "outputIndexes": [ 1910 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1900, 1910, 1903 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_293_output_0", "outputIndexes": [ 1911 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1911, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_57_output_0", "outputIndexes": [ 1912 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1912, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_615_output_0", "outputIndexes": [ 1913 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1898, 1913, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_77_output_0", "outputIndexes": [ 1914 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1914 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_38_output_0", "outputIndexes": [ 1915 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1912, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_614_output_0", "outputIndexes": [ 1916 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1898, 22, 1916, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_76_output_0", "outputIndexes": [ 1917 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1915, 1917 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_250_output_0", "outputIndexes": [ 1918 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1918, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_153_output_0", "outputIndexes": [ 1919 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1899, 1919 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_98_output_0", "outputIndexes": [ 1920 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3989 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1205884804, 1310742, 327680, 0, 0 ] } , "name": "/layers.19/self_attn/k_proj/Linear", "outputIndexes": [ 3994 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3994 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 3995 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3995 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1921 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1885, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_610_output_0", "outputIndexes": [ 1922 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1893, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_611_output_0", "outputIndexes": [ 1923 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1922, 1923, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_248_output_0", "outputIndexes": [ 1924 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921, 1924 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_173_output_0", "outputIndexes": [ 1925 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1925 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1207523226, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_19/Mul_1_output_0", "outputIndexes": [ 1927 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1927, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_154_output_0", "outputIndexes": [ 1928 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1927 ] , "main_type": "NONE", "name": "/Shape_269_output_0", "outputIndexes": [ 1929 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1929 ] , "main_type": "NONE", "name": "Shape7652", "outputIndexes": [ 1930 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1929 ] , "main_type": "NONE", "name": "Rank7654", "outputIndexes": [ 1931 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1931, 1931 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7656", "outputIndexes": [ 1932 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1932 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7657", "outputIndexes": [ 1933 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1932, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7659", "outputIndexes": [ 1934 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1934 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7660", "outputIndexes": [ 1935 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1930, 1933, 1935, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7663", "outputIndexes": [ 1936 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1936 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7664", "outputIndexes": [ 1937 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 1937 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7665", "outputIndexes": [ 1938 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1938, 1937 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7666", "outputIndexes": [ 1939 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1929, 1939, 1932 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_294_output_0", "outputIndexes": [ 1940 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1940, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_58_output_0", "outputIndexes": [ 1941 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1941, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_617_output_0", "outputIndexes": [ 1942 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1927, 1942, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_79_output_0", "outputIndexes": [ 1943 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1943 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_39_output_0", "outputIndexes": [ 1944 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1941, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_616_output_0", "outputIndexes": [ 1945 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1927, 22, 1945, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_78_output_0", "outputIndexes": [ 1946 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1944, 1946 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_251_output_0", "outputIndexes": [ 1947 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1947, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_155_output_0", "outputIndexes": [ 1948 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1928, 1948 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_99_output_0", "outputIndexes": [ 1949 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3989 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1207524250, 1310742, 327680, 0, 0 ] } , "name": "/layers.19/self_attn/v_proj/Linear", "outputIndexes": [ 3998 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3998 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 3999 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3999 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1950 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1885, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_612_output_0", "outputIndexes": [ 1951 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1893, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_613_output_0", "outputIndexes": [ 1952 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1951, 1952, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_249_output_0", "outputIndexes": [ 1953 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1950, 1953 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_174_output_0", "outputIndexes": [ 1954 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1920, 1949, 1954, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_179_output_0", "outputIndexes": [ 1955 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1955 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4000 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4000 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4001 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4001 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1209162672, 5242902, 1310720, 0, 0 ] } , "name": "/layers.19/self_attn/o_proj/Linear", "outputIndexes": [ 4002 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4002 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4003 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4003 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1956 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1872, 1956 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_101_output_0", "outputIndexes": [ 1957 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1957 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1215716294, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_19/Mul_1_output_0", "outputIndexes": [ 1958 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1958 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4004 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4004 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4005 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4005 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1215736774, 12451862, 3112960, 0, 0 ] } , "name": "/layers.19/mlp/gate_proj/Linear", "outputIndexes": [ 4006 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4006 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4007 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4007 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1959 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1959 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_19/Mul_output_0", "outputIndexes": [ 1960 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4005 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1231301596, 12451862, 3112960, 0, 0 ] } , "name": "/layers.19/mlp/up_proj/Linear", "outputIndexes": [ 4010 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4010 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4011 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4011 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1961 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1960, 1961 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_19/Mul_output_0", "outputIndexes": [ 1962 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1962 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4012 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4012 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4013 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4013 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1246866418, 12451862, 3112960, 0, 0 ] } , "name": "/layers.19/mlp/down_proj/Linear", "outputIndexes": [ 4014 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4014 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4015 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4015 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1963 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1957, 1963 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_102_output_0", "outputIndexes": [ 1964 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1964, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_180_output_0", "outputIndexes": [ 1965 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1965 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1262431240, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_20/Mul_1_output_0", "outputIndexes": [ 1966 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4016 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4016 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4017 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4017 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1262451720, 5242902, 1310720, 0, 0 ] } , "name": "/layers.20/self_attn/q_proj/Linear", "outputIndexes": [ 4018 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4018 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4019 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4019 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1967 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966 ] , "main_type": "NONE", "name": "/Shape_280_output_0", "outputIndexes": [ 1968 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1968 ] , "main_type": "NONE", "name": "Shape7995", "outputIndexes": [ 1969 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1968 ] , "main_type": "NONE", "name": "Rank7997", "outputIndexes": [ 1970 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1970, 1970 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7999", "outputIndexes": [ 1971 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8000", "outputIndexes": [ 1972 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8002", "outputIndexes": [ 1973 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1973 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8003", "outputIndexes": [ 1974 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1969, 1972, 1974, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8006", "outputIndexes": [ 1975 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1975 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8007", "outputIndexes": [ 1976 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1976, 1976 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8009", "outputIndexes": [ 1977 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1968, 1977, 1971 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_306_output_0", "outputIndexes": [ 1978 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1978, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_640_output_0", "outputIndexes": [ 1979 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8017", "outputIndexes": [ 1980 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1973 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8020", "outputIndexes": [ 1981 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1969, 1980, 1981, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8023", "outputIndexes": [ 1982 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1982 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8024", "outputIndexes": [ 1983 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 1983 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8025", "outputIndexes": [ 1984 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1984, 1983 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8026", "outputIndexes": [ 1985 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1968, 1985, 1971 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_307_output_0", "outputIndexes": [ 1986 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1986, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_641_output_0", "outputIndexes": [ 1987 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1979, 1987, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_260_output_0", "outputIndexes": [ 1988 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1967, 1988 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_181_output_0", "outputIndexes": [ 1989 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1989 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1269005342, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_20/Mul_1_output_0", "outputIndexes": [ 1991 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1991, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_160_output_0", "outputIndexes": [ 1992 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1991 ] , "main_type": "NONE", "name": "/Shape_282_output_0", "outputIndexes": [ 1993 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1993 ] , "main_type": "NONE", "name": "Shape8145", "outputIndexes": [ 1994 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1993 ] , "main_type": "NONE", "name": "Rank8147", "outputIndexes": [ 1995 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1995, 1995 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8149", "outputIndexes": [ 1996 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1996 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8150", "outputIndexes": [ 1997 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1996, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8152", "outputIndexes": [ 1998 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1998 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8153", "outputIndexes": [ 1999 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1994, 1997, 1999, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8156", "outputIndexes": [ 2000 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2000 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8157", "outputIndexes": [ 2001 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2001 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8158", "outputIndexes": [ 2002 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2002, 2001 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8159", "outputIndexes": [ 2003 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1993, 2003, 1996 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_308_output_0", "outputIndexes": [ 2004 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2004, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_60_output_0", "outputIndexes": [ 2005 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2005, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_647_output_0", "outputIndexes": [ 2006 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1991, 2006, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_81_output_0", "outputIndexes": [ 2007 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2007 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_40_output_0", "outputIndexes": [ 2008 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2005, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_646_output_0", "outputIndexes": [ 2009 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1991, 22, 2009, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_80_output_0", "outputIndexes": [ 2010 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2008, 2010 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_263_output_0", "outputIndexes": [ 2011 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2011, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_161_output_0", "outputIndexes": [ 2012 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1992, 2012 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_103_output_0", "outputIndexes": [ 2013 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4017 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1269006366, 1310742, 327680, 0, 0 ] } , "name": "/layers.20/self_attn/k_proj/Linear", "outputIndexes": [ 4022 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4022 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4023 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4023 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2014 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1978, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_642_output_0", "outputIndexes": [ 2015 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1986, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_643_output_0", "outputIndexes": [ 2016 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2015, 2016, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_261_output_0", "outputIndexes": [ 2017 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2014, 2017 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_182_output_0", "outputIndexes": [ 2018 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2018 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1270644788, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_20/Mul_1_output_0", "outputIndexes": [ 2020 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2020, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_162_output_0", "outputIndexes": [ 2021 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2020 ] , "main_type": "NONE", "name": "/Shape_283_output_0", "outputIndexes": [ 2022 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2022 ] , "main_type": "NONE", "name": "Shape8041", "outputIndexes": [ 2023 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2022 ] , "main_type": "NONE", "name": "Rank8043", "outputIndexes": [ 2024 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2024, 2024 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8045", "outputIndexes": [ 2025 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8046", "outputIndexes": [ 2026 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8048", "outputIndexes": [ 2027 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2027 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8049", "outputIndexes": [ 2028 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2023, 2026, 2028, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8052", "outputIndexes": [ 2029 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2029 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8053", "outputIndexes": [ 2030 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2030 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8054", "outputIndexes": [ 2031 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2031, 2030 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8055", "outputIndexes": [ 2032 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2022, 2032, 2025 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_309_output_0", "outputIndexes": [ 2033 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2033, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_61_output_0", "outputIndexes": [ 2034 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2034, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_649_output_0", "outputIndexes": [ 2035 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2020, 2035, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_83_output_0", "outputIndexes": [ 2036 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2036 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_41_output_0", "outputIndexes": [ 2037 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2034, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_648_output_0", "outputIndexes": [ 2038 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2020, 22, 2038, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_82_output_0", "outputIndexes": [ 2039 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2037, 2039 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_264_output_0", "outputIndexes": [ 2040 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2040, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_163_output_0", "outputIndexes": [ 2041 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2021, 2041 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_104_output_0", "outputIndexes": [ 2042 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4017 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1270645812, 1310742, 327680, 0, 0 ] } , "name": "/layers.20/self_attn/v_proj/Linear", "outputIndexes": [ 4026 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4026 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4027 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4027 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2043 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1978, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_644_output_0", "outputIndexes": [ 2044 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1986, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_645_output_0", "outputIndexes": [ 2045 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2044, 2045, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_262_output_0", "outputIndexes": [ 2046 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2043, 2046 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_183_output_0", "outputIndexes": [ 2047 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2013, 2042, 2047, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_188_output_0", "outputIndexes": [ 2048 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2048 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4028 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4028 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4029 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4029 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1272284234, 5242902, 1310720, 0, 0 ] } , "name": "/layers.20/self_attn/o_proj/Linear", "outputIndexes": [ 4030 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4030 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4031 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4031 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2049 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1965, 2049 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_106_output_0", "outputIndexes": [ 2050 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2050 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1278837856, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_20/Mul_1_output_0", "outputIndexes": [ 2051 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2051 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4032 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4032 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4033 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4033 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1278858336, 12451862, 3112960, 0, 0 ] } , "name": "/layers.20/mlp/gate_proj/Linear", "outputIndexes": [ 4034 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4034 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4035 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4035 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2052 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2052 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_20/Mul_output_0", "outputIndexes": [ 2053 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4033 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1294423158, 12451862, 3112960, 0, 0 ] } , "name": "/layers.20/mlp/up_proj/Linear", "outputIndexes": [ 4038 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4038 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4039 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4039 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2054 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2053, 2054 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_20/Mul_output_0", "outputIndexes": [ 2055 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4040 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4040 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4041 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4041 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1309987980, 12451862, 3112960, 0, 0 ] } , "name": "/layers.20/mlp/down_proj/Linear", "outputIndexes": [ 4042 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4042 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4043 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4043 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2056 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2050, 2056 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_107_output_0", "outputIndexes": [ 2057 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_189_output_0", "outputIndexes": [ 2058 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2058 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1325552802, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_21/Mul_1_output_0", "outputIndexes": [ 2059 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2059 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4044 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4044 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4045 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4045 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1325573282, 5242902, 1310720, 0, 0 ] } , "name": "/layers.21/self_attn/q_proj/Linear", "outputIndexes": [ 4046 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4046 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4047 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4047 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2060 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2059 ] , "main_type": "NONE", "name": "/Shape_294_output_0", "outputIndexes": [ 2061 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2061 ] , "main_type": "NONE", "name": "Shape8384", "outputIndexes": [ 2062 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2061 ] , "main_type": "NONE", "name": "Rank8386", "outputIndexes": [ 2063 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2063, 2063 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8388", "outputIndexes": [ 2064 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2064 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8389", "outputIndexes": [ 2065 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2064, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8391", "outputIndexes": [ 2066 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2066 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8392", "outputIndexes": [ 2067 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2062, 2065, 2067, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8395", "outputIndexes": [ 2068 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2068 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8396", "outputIndexes": [ 2069 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2069, 2069 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8398", "outputIndexes": [ 2070 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2061, 2070, 2064 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_321_output_0", "outputIndexes": [ 2071 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2071, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_672_output_0", "outputIndexes": [ 2072 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2064 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8406", "outputIndexes": [ 2073 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2066 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8409", "outputIndexes": [ 2074 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2062, 2073, 2074, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8412", "outputIndexes": [ 2075 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2075 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8413", "outputIndexes": [ 2076 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2076 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8414", "outputIndexes": [ 2077 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2077, 2076 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8415", "outputIndexes": [ 2078 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2061, 2078, 2064 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_322_output_0", "outputIndexes": [ 2079 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2079, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_673_output_0", "outputIndexes": [ 2080 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2072, 2080, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_273_output_0", "outputIndexes": [ 2081 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2060, 2081 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_190_output_0", "outputIndexes": [ 2082 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2082 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1332126904, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_21/Mul_1_output_0", "outputIndexes": [ 2084 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2084, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_168_output_0", "outputIndexes": [ 2085 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2084 ] , "main_type": "NONE", "name": "/Shape_296_output_0", "outputIndexes": [ 2086 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2086 ] , "main_type": "NONE", "name": "Shape8534", "outputIndexes": [ 2087 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2086 ] , "main_type": "NONE", "name": "Rank8536", "outputIndexes": [ 2088 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2088, 2088 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8538", "outputIndexes": [ 2089 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2089 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8539", "outputIndexes": [ 2090 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2089, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8541", "outputIndexes": [ 2091 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2091 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8542", "outputIndexes": [ 2092 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2087, 2090, 2092, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8545", "outputIndexes": [ 2093 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2093 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8546", "outputIndexes": [ 2094 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2094 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8547", "outputIndexes": [ 2095 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2095, 2094 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8548", "outputIndexes": [ 2096 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2086, 2096, 2089 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_323_output_0", "outputIndexes": [ 2097 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2097, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_63_output_0", "outputIndexes": [ 2098 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2098, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_679_output_0", "outputIndexes": [ 2099 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2084, 2099, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_85_output_0", "outputIndexes": [ 2100 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2100 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_42_output_0", "outputIndexes": [ 2101 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2098, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_678_output_0", "outputIndexes": [ 2102 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2084, 22, 2102, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_84_output_0", "outputIndexes": [ 2103 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2101, 2103 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_276_output_0", "outputIndexes": [ 2104 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2104, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_169_output_0", "outputIndexes": [ 2105 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2085, 2105 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_108_output_0", "outputIndexes": [ 2106 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4045 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1332127928, 1310742, 327680, 0, 0 ] } , "name": "/layers.21/self_attn/k_proj/Linear", "outputIndexes": [ 4050 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4050 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4051 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4051 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2107 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2071, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_674_output_0", "outputIndexes": [ 2108 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2079, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_675_output_0", "outputIndexes": [ 2109 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2108, 2109, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_274_output_0", "outputIndexes": [ 2110 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2107, 2110 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_191_output_0", "outputIndexes": [ 2111 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2111 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1333766350, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_21/Mul_1_output_0", "outputIndexes": [ 2113 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2113, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_170_output_0", "outputIndexes": [ 2114 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2113 ] , "main_type": "NONE", "name": "/Shape_297_output_0", "outputIndexes": [ 2115 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2115 ] , "main_type": "NONE", "name": "Shape8430", "outputIndexes": [ 2116 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2115 ] , "main_type": "NONE", "name": "Rank8432", "outputIndexes": [ 2117 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2117, 2117 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8434", "outputIndexes": [ 2118 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2118 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8435", "outputIndexes": [ 2119 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2118, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8437", "outputIndexes": [ 2120 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2120 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8438", "outputIndexes": [ 2121 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2116, 2119, 2121, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8441", "outputIndexes": [ 2122 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2122 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8442", "outputIndexes": [ 2123 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2123 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8443", "outputIndexes": [ 2124 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2124, 2123 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8444", "outputIndexes": [ 2125 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2115, 2125, 2118 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_324_output_0", "outputIndexes": [ 2126 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2126, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_64_output_0", "outputIndexes": [ 2127 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2127, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_681_output_0", "outputIndexes": [ 2128 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2113, 2128, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_87_output_0", "outputIndexes": [ 2129 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2129 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_43_output_0", "outputIndexes": [ 2130 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2127, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_680_output_0", "outputIndexes": [ 2131 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2113, 22, 2131, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_86_output_0", "outputIndexes": [ 2132 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2130, 2132 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_277_output_0", "outputIndexes": [ 2133 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2133, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_171_output_0", "outputIndexes": [ 2134 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2114, 2134 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_109_output_0", "outputIndexes": [ 2135 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4045 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1333767374, 1310742, 327680, 0, 0 ] } , "name": "/layers.21/self_attn/v_proj/Linear", "outputIndexes": [ 4054 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4054 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4055 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4055 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2136 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2071, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_676_output_0", "outputIndexes": [ 2137 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2079, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_677_output_0", "outputIndexes": [ 2138 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2137, 2138, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_275_output_0", "outputIndexes": [ 2139 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2136, 2139 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_192_output_0", "outputIndexes": [ 2140 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2106, 2135, 2140, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_197_output_0", "outputIndexes": [ 2141 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2141 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4056 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4056 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4057 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4057 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1335405796, 5242902, 1310720, 0, 0 ] } , "name": "/layers.21/self_attn/o_proj/Linear", "outputIndexes": [ 4058 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4058 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4059 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4059 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2142 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2058, 2142 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_111_output_0", "outputIndexes": [ 2143 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2143 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1341959418, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_21/Mul_1_output_0", "outputIndexes": [ 2144 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2144 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4060 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4060 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4061 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4061 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1341979898, 12451862, 3112960, 0, 0 ] } , "name": "/layers.21/mlp/gate_proj/Linear", "outputIndexes": [ 4062 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4062 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4063 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4063 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2145 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2145 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_21/Mul_output_0", "outputIndexes": [ 2146 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4061 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1357544720, 12451862, 3112960, 0, 0 ] } , "name": "/layers.21/mlp/up_proj/Linear", "outputIndexes": [ 4066 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4066 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4067 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4067 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2147 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2146, 2147 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_21/Mul_output_0", "outputIndexes": [ 2148 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2148 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4068 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4068 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4069 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4069 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1373109542, 12451862, 3112960, 0, 0 ] } , "name": "/layers.21/mlp/down_proj/Linear", "outputIndexes": [ 4070 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4070 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4071 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4071 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2149 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2143, 2149 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_112_output_0", "outputIndexes": [ 2150 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2150, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_198_output_0", "outputIndexes": [ 2151 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2151 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1388674364, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_22/Mul_1_output_0", "outputIndexes": [ 2152 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2152 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4072 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4072 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4073 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4073 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1388694844, 5242902, 1310720, 0, 0 ] } , "name": "/layers.22/self_attn/q_proj/Linear", "outputIndexes": [ 4074 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4074 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4075 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4075 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2153 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2152 ] , "main_type": "NONE", "name": "/Shape_308_output_0", "outputIndexes": [ 2154 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2154 ] , "main_type": "NONE", "name": "Shape8773", "outputIndexes": [ 2155 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2154 ] , "main_type": "NONE", "name": "Rank8775", "outputIndexes": [ 2156 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2156, 2156 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8777", "outputIndexes": [ 2157 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2157 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8778", "outputIndexes": [ 2158 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2157, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8780", "outputIndexes": [ 2159 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2159 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8781", "outputIndexes": [ 2160 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2155, 2158, 2160, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8784", "outputIndexes": [ 2161 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2161 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8785", "outputIndexes": [ 2162 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2162, 2162 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8787", "outputIndexes": [ 2163 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2154, 2163, 2157 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_336_output_0", "outputIndexes": [ 2164 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2164, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_704_output_0", "outputIndexes": [ 2165 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2157 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8795", "outputIndexes": [ 2166 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2159 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8798", "outputIndexes": [ 2167 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2155, 2166, 2167, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8801", "outputIndexes": [ 2168 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2168 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8802", "outputIndexes": [ 2169 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2169 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8803", "outputIndexes": [ 2170 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2170, 2169 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8804", "outputIndexes": [ 2171 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2154, 2171, 2157 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_337_output_0", "outputIndexes": [ 2172 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2172, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_705_output_0", "outputIndexes": [ 2173 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2165, 2173, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_286_output_0", "outputIndexes": [ 2174 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2153, 2174 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_199_output_0", "outputIndexes": [ 2175 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2175 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1395248466, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_22/Mul_1_output_0", "outputIndexes": [ 2177 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2177, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_176_output_0", "outputIndexes": [ 2178 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2177 ] , "main_type": "NONE", "name": "/Shape_310_output_0", "outputIndexes": [ 2179 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2179 ] , "main_type": "NONE", "name": "Shape8923", "outputIndexes": [ 2180 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2179 ] , "main_type": "NONE", "name": "Rank8925", "outputIndexes": [ 2181 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2181, 2181 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8927", "outputIndexes": [ 2182 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2182 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8928", "outputIndexes": [ 2183 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2182, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8930", "outputIndexes": [ 2184 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2184 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8931", "outputIndexes": [ 2185 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2180, 2183, 2185, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8934", "outputIndexes": [ 2186 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2186 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8935", "outputIndexes": [ 2187 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2187 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8936", "outputIndexes": [ 2188 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2188, 2187 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8937", "outputIndexes": [ 2189 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2179, 2189, 2182 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_338_output_0", "outputIndexes": [ 2190 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2190, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_66_output_0", "outputIndexes": [ 2191 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2191, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_711_output_0", "outputIndexes": [ 2192 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2177, 2192, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_89_output_0", "outputIndexes": [ 2193 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2193 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_44_output_0", "outputIndexes": [ 2194 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2191, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_710_output_0", "outputIndexes": [ 2195 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2177, 22, 2195, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_88_output_0", "outputIndexes": [ 2196 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2194, 2196 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_289_output_0", "outputIndexes": [ 2197 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2197, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_177_output_0", "outputIndexes": [ 2198 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2178, 2198 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_113_output_0", "outputIndexes": [ 2199 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4073 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1395249490, 1310742, 327680, 0, 0 ] } , "name": "/layers.22/self_attn/k_proj/Linear", "outputIndexes": [ 4078 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4078 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4079 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4079 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2200 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2164, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_706_output_0", "outputIndexes": [ 2201 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2172, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_707_output_0", "outputIndexes": [ 2202 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2201, 2202, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_287_output_0", "outputIndexes": [ 2203 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2200, 2203 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_200_output_0", "outputIndexes": [ 2204 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2204 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1396887912, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_22/Mul_1_output_0", "outputIndexes": [ 2206 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_178_output_0", "outputIndexes": [ 2207 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206 ] , "main_type": "NONE", "name": "/Shape_311_output_0", "outputIndexes": [ 2208 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2208 ] , "main_type": "NONE", "name": "Shape8819", "outputIndexes": [ 2209 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2208 ] , "main_type": "NONE", "name": "Rank8821", "outputIndexes": [ 2210 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2210, 2210 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8823", "outputIndexes": [ 2211 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2211 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8824", "outputIndexes": [ 2212 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2211, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8826", "outputIndexes": [ 2213 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2213 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8827", "outputIndexes": [ 2214 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2209, 2212, 2214, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8830", "outputIndexes": [ 2215 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2215 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8831", "outputIndexes": [ 2216 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2216 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8832", "outputIndexes": [ 2217 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2217, 2216 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8833", "outputIndexes": [ 2218 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2208, 2218, 2211 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_339_output_0", "outputIndexes": [ 2219 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2219, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_67_output_0", "outputIndexes": [ 2220 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2220, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_713_output_0", "outputIndexes": [ 2221 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206, 2221, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_91_output_0", "outputIndexes": [ 2222 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2222 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_45_output_0", "outputIndexes": [ 2223 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2220, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_712_output_0", "outputIndexes": [ 2224 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2206, 22, 2224, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_90_output_0", "outputIndexes": [ 2225 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2223, 2225 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_290_output_0", "outputIndexes": [ 2226 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2226, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_179_output_0", "outputIndexes": [ 2227 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2207, 2227 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_114_output_0", "outputIndexes": [ 2228 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4073 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1396888936, 1310742, 327680, 0, 0 ] } , "name": "/layers.22/self_attn/v_proj/Linear", "outputIndexes": [ 4082 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4082 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4083 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4083 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2229 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2164, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_708_output_0", "outputIndexes": [ 2230 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2172, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_709_output_0", "outputIndexes": [ 2231 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2230, 2231, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_288_output_0", "outputIndexes": [ 2232 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2229, 2232 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_201_output_0", "outputIndexes": [ 2233 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2199, 2228, 2233, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_206_output_0", "outputIndexes": [ 2234 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2234 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4084 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4084 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4085 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4085 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1398527358, 5242902, 1310720, 0, 0 ] } , "name": "/layers.22/self_attn/o_proj/Linear", "outputIndexes": [ 4086 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4086 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4087 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4087 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2235 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2151, 2235 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_116_output_0", "outputIndexes": [ 2236 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2236 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1405080980, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_22/Mul_1_output_0", "outputIndexes": [ 2237 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2237 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4088 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4088 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4089 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4089 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1405101460, 12451862, 3112960, 0, 0 ] } , "name": "/layers.22/mlp/gate_proj/Linear", "outputIndexes": [ 4090 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4090 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4091 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4091 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2238 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2238 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_22/Mul_output_0", "outputIndexes": [ 2239 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4089 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1420666282, 12451862, 3112960, 0, 0 ] } , "name": "/layers.22/mlp/up_proj/Linear", "outputIndexes": [ 4094 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4094 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4095 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4095 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2240 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2239, 2240 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_22/Mul_output_0", "outputIndexes": [ 2241 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2241 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4096 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4096 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4097 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4097 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1436231104, 12451862, 3112960, 0, 0 ] } , "name": "/layers.22/mlp/down_proj/Linear", "outputIndexes": [ 4098 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4098 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4099 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4099 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2242 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2236, 2242 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_117_output_0", "outputIndexes": [ 2243 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2243, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_207_output_0", "outputIndexes": [ 2244 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2244 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1451795926, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_23/Mul_1_output_0", "outputIndexes": [ 2245 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2245 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4100 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4100 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4101 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4101 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1451816406, 5242902, 1310720, 0, 0 ] } , "name": "/layers.23/self_attn/q_proj/Linear", "outputIndexes": [ 4102 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4102 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4103 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4103 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2246 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2245 ] , "main_type": "NONE", "name": "/Shape_322_output_0", "outputIndexes": [ 2247 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2247 ] , "main_type": "NONE", "name": "Shape9162", "outputIndexes": [ 2248 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2247 ] , "main_type": "NONE", "name": "Rank9164", "outputIndexes": [ 2249 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2249, 2249 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9166", "outputIndexes": [ 2250 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2250 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9167", "outputIndexes": [ 2251 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2250, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9169", "outputIndexes": [ 2252 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2252 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9170", "outputIndexes": [ 2253 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2248, 2251, 2253, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9173", "outputIndexes": [ 2254 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2254 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9174", "outputIndexes": [ 2255 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2255, 2255 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9176", "outputIndexes": [ 2256 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2247, 2256, 2250 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_351_output_0", "outputIndexes": [ 2257 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2257, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_736_output_0", "outputIndexes": [ 2258 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2250 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9184", "outputIndexes": [ 2259 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2252 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9187", "outputIndexes": [ 2260 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2248, 2259, 2260, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9190", "outputIndexes": [ 2261 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2261 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9191", "outputIndexes": [ 2262 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2262 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9192", "outputIndexes": [ 2263 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2263, 2262 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9193", "outputIndexes": [ 2264 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2247, 2264, 2250 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_352_output_0", "outputIndexes": [ 2265 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2265, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_737_output_0", "outputIndexes": [ 2266 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2258, 2266, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_299_output_0", "outputIndexes": [ 2267 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2246, 2267 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_208_output_0", "outputIndexes": [ 2268 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2268 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1458370028, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_23/Mul_1_output_0", "outputIndexes": [ 2270 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2270, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_184_output_0", "outputIndexes": [ 2271 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2270 ] , "main_type": "NONE", "name": "/Shape_324_output_0", "outputIndexes": [ 2272 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2272 ] , "main_type": "NONE", "name": "Shape9312", "outputIndexes": [ 2273 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2272 ] , "main_type": "NONE", "name": "Rank9314", "outputIndexes": [ 2274 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2274, 2274 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9316", "outputIndexes": [ 2275 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2275 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9317", "outputIndexes": [ 2276 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2275, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9319", "outputIndexes": [ 2277 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2277 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9320", "outputIndexes": [ 2278 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2273, 2276, 2278, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9323", "outputIndexes": [ 2279 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2279 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9324", "outputIndexes": [ 2280 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2280 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9325", "outputIndexes": [ 2281 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2281, 2280 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9326", "outputIndexes": [ 2282 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2272, 2282, 2275 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_353_output_0", "outputIndexes": [ 2283 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2283, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_69_output_0", "outputIndexes": [ 2284 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_743_output_0", "outputIndexes": [ 2285 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2270, 2285, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_93_output_0", "outputIndexes": [ 2286 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2286 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_46_output_0", "outputIndexes": [ 2287 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_742_output_0", "outputIndexes": [ 2288 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2270, 22, 2288, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_92_output_0", "outputIndexes": [ 2289 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2287, 2289 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_302_output_0", "outputIndexes": [ 2290 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2290, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_185_output_0", "outputIndexes": [ 2291 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2271, 2291 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_118_output_0", "outputIndexes": [ 2292 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4101 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1458371052, 1310742, 327680, 0, 0 ] } , "name": "/layers.23/self_attn/k_proj/Linear", "outputIndexes": [ 4106 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4106 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4107 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4107 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2293 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2257, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_738_output_0", "outputIndexes": [ 2294 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2265, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_739_output_0", "outputIndexes": [ 2295 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2294, 2295, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_300_output_0", "outputIndexes": [ 2296 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2293, 2296 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_209_output_0", "outputIndexes": [ 2297 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2297 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1460009474, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_23/Mul_1_output_0", "outputIndexes": [ 2299 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_186_output_0", "outputIndexes": [ 2300 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299 ] , "main_type": "NONE", "name": "/Shape_325_output_0", "outputIndexes": [ 2301 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2301 ] , "main_type": "NONE", "name": "Shape9208", "outputIndexes": [ 2302 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2301 ] , "main_type": "NONE", "name": "Rank9210", "outputIndexes": [ 2303 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2303, 2303 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9212", "outputIndexes": [ 2304 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2304 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9213", "outputIndexes": [ 2305 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2304, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9215", "outputIndexes": [ 2306 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2306 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9216", "outputIndexes": [ 2307 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2302, 2305, 2307, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9219", "outputIndexes": [ 2308 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2308 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9220", "outputIndexes": [ 2309 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2309 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9221", "outputIndexes": [ 2310 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2310, 2309 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9222", "outputIndexes": [ 2311 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2301, 2311, 2304 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_354_output_0", "outputIndexes": [ 2312 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2312, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_70_output_0", "outputIndexes": [ 2313 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2313, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_745_output_0", "outputIndexes": [ 2314 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299, 2314, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_95_output_0", "outputIndexes": [ 2315 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2315 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_47_output_0", "outputIndexes": [ 2316 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2313, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_744_output_0", "outputIndexes": [ 2317 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299, 22, 2317, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_94_output_0", "outputIndexes": [ 2318 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2316, 2318 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_303_output_0", "outputIndexes": [ 2319 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2319, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_187_output_0", "outputIndexes": [ 2320 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2300, 2320 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_119_output_0", "outputIndexes": [ 2321 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4101 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1460010498, 1310742, 327680, 0, 0 ] } , "name": "/layers.23/self_attn/v_proj/Linear", "outputIndexes": [ 4110 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4110 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4111 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4111 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2322 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2257, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_740_output_0", "outputIndexes": [ 2323 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2265, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_741_output_0", "outputIndexes": [ 2324 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2323, 2324, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_301_output_0", "outputIndexes": [ 2325 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2322, 2325 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_210_output_0", "outputIndexes": [ 2326 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2292, 2321, 2326, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_215_output_0", "outputIndexes": [ 2327 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2327 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4112 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4112 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4113 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4113 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1461648920, 5242902, 1310720, 0, 0 ] } , "name": "/layers.23/self_attn/o_proj/Linear", "outputIndexes": [ 4114 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4114 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4115 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4115 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2328 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2244, 2328 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_121_output_0", "outputIndexes": [ 2329 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2329 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1468202542, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_23/Mul_1_output_0", "outputIndexes": [ 2330 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2330 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4116 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4116 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4117 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4117 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1468223022, 12451862, 3112960, 0, 0 ] } , "name": "/layers.23/mlp/gate_proj/Linear", "outputIndexes": [ 4118 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4118 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4119 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4119 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2331 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2331 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_23/Mul_output_0", "outputIndexes": [ 2332 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4117 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1483787844, 12451862, 3112960, 0, 0 ] } , "name": "/layers.23/mlp/up_proj/Linear", "outputIndexes": [ 4122 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4122 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4123 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4123 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2333 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2332, 2333 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_23/Mul_output_0", "outputIndexes": [ 2334 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2334 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4124 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4124 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4125 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4125 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1499352666, 12451862, 3112960, 0, 0 ] } , "name": "/layers.23/mlp/down_proj/Linear", "outputIndexes": [ 4126 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4126 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4127 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4127 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2335 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2329, 2335 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_122_output_0", "outputIndexes": [ 2336 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2336, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_216_output_0", "outputIndexes": [ 2337 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2337 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1514917488, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_24/Mul_1_output_0", "outputIndexes": [ 2338 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2338 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4128 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4128 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4129 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4129 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1514937968, 5242902, 1310720, 0, 0 ] } , "name": "/layers.24/self_attn/q_proj/Linear", "outputIndexes": [ 4130 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4130 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4131 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4131 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2339 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2338 ] , "main_type": "NONE", "name": "/Shape_336_output_0", "outputIndexes": [ 2340 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2340 ] , "main_type": "NONE", "name": "Shape9551", "outputIndexes": [ 2341 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2340 ] , "main_type": "NONE", "name": "Rank9553", "outputIndexes": [ 2342 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2342, 2342 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9555", "outputIndexes": [ 2343 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2343 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9556", "outputIndexes": [ 2344 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2343, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9558", "outputIndexes": [ 2345 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2345 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9559", "outputIndexes": [ 2346 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2341, 2344, 2346, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9562", "outputIndexes": [ 2347 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2347 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9563", "outputIndexes": [ 2348 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2348, 2348 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9565", "outputIndexes": [ 2349 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2340, 2349, 2343 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_366_output_0", "outputIndexes": [ 2350 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2350, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_768_output_0", "outputIndexes": [ 2351 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2343 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9573", "outputIndexes": [ 2352 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2345 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9576", "outputIndexes": [ 2353 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2341, 2352, 2353, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9579", "outputIndexes": [ 2354 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2354 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9580", "outputIndexes": [ 2355 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2355 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9581", "outputIndexes": [ 2356 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2356, 2355 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9582", "outputIndexes": [ 2357 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2340, 2357, 2343 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_367_output_0", "outputIndexes": [ 2358 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2358, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_769_output_0", "outputIndexes": [ 2359 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2351, 2359, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_312_output_0", "outputIndexes": [ 2360 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2339, 2360 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_217_output_0", "outputIndexes": [ 2361 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2361 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1521491590, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_24/Mul_1_output_0", "outputIndexes": [ 2363 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_192_output_0", "outputIndexes": [ 2364 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363 ] , "main_type": "NONE", "name": "/Shape_338_output_0", "outputIndexes": [ 2365 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2365 ] , "main_type": "NONE", "name": "Shape9701", "outputIndexes": [ 2366 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2365 ] , "main_type": "NONE", "name": "Rank9703", "outputIndexes": [ 2367 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2367, 2367 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9705", "outputIndexes": [ 2368 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2368 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9706", "outputIndexes": [ 2369 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2368, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9708", "outputIndexes": [ 2370 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2370 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9709", "outputIndexes": [ 2371 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2366, 2369, 2371, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9712", "outputIndexes": [ 2372 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2372 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9713", "outputIndexes": [ 2373 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2373 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9714", "outputIndexes": [ 2374 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2374, 2373 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9715", "outputIndexes": [ 2375 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2365, 2375, 2368 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_368_output_0", "outputIndexes": [ 2376 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2376, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_72_output_0", "outputIndexes": [ 2377 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2377, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_775_output_0", "outputIndexes": [ 2378 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363, 2378, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_97_output_0", "outputIndexes": [ 2379 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2379 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_48_output_0", "outputIndexes": [ 2380 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2377, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_774_output_0", "outputIndexes": [ 2381 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2363, 22, 2381, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_96_output_0", "outputIndexes": [ 2382 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2380, 2382 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_315_output_0", "outputIndexes": [ 2383 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2383, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_193_output_0", "outputIndexes": [ 2384 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2364, 2384 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_123_output_0", "outputIndexes": [ 2385 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4129 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1521492614, 1310742, 327680, 0, 0 ] } , "name": "/layers.24/self_attn/k_proj/Linear", "outputIndexes": [ 4134 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4134 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4135 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4135 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2386 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2350, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_770_output_0", "outputIndexes": [ 2387 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2358, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_771_output_0", "outputIndexes": [ 2388 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2387, 2388, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_313_output_0", "outputIndexes": [ 2389 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2386, 2389 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_218_output_0", "outputIndexes": [ 2390 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2390 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1523131036, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_24/Mul_1_output_0", "outputIndexes": [ 2392 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2392, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_194_output_0", "outputIndexes": [ 2393 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2392 ] , "main_type": "NONE", "name": "/Shape_339_output_0", "outputIndexes": [ 2394 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2394 ] , "main_type": "NONE", "name": "Shape9597", "outputIndexes": [ 2395 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2394 ] , "main_type": "NONE", "name": "Rank9599", "outputIndexes": [ 2396 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2396, 2396 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9601", "outputIndexes": [ 2397 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2397 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9602", "outputIndexes": [ 2398 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2397, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9604", "outputIndexes": [ 2399 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2399 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9605", "outputIndexes": [ 2400 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2395, 2398, 2400, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9608", "outputIndexes": [ 2401 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2401 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9609", "outputIndexes": [ 2402 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2402 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9610", "outputIndexes": [ 2403 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2403, 2402 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9611", "outputIndexes": [ 2404 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2394, 2404, 2397 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_369_output_0", "outputIndexes": [ 2405 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2405, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_73_output_0", "outputIndexes": [ 2406 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2406, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_777_output_0", "outputIndexes": [ 2407 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2392, 2407, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_99_output_0", "outputIndexes": [ 2408 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2408 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_49_output_0", "outputIndexes": [ 2409 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2406, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_776_output_0", "outputIndexes": [ 2410 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2392, 22, 2410, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_98_output_0", "outputIndexes": [ 2411 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2409, 2411 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_316_output_0", "outputIndexes": [ 2412 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2412, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_195_output_0", "outputIndexes": [ 2413 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2393, 2413 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_124_output_0", "outputIndexes": [ 2414 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4129 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1523132060, 1310742, 327680, 0, 0 ] } , "name": "/layers.24/self_attn/v_proj/Linear", "outputIndexes": [ 4138 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4138 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4139 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4139 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2415 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2350, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_772_output_0", "outputIndexes": [ 2416 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2358, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_773_output_0", "outputIndexes": [ 2417 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2416, 2417, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_314_output_0", "outputIndexes": [ 2418 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2415, 2418 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_219_output_0", "outputIndexes": [ 2419 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2385, 2414, 2419, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_224_output_0", "outputIndexes": [ 2420 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2420 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4140 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4140 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4141 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4141 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1524770482, 5242902, 1310720, 0, 0 ] } , "name": "/layers.24/self_attn/o_proj/Linear", "outputIndexes": [ 4142 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4142 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4143 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4143 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.24/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2421 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2337, 2421 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_126_output_0", "outputIndexes": [ 2422 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2422 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1531324104, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_24/Mul_1_output_0", "outputIndexes": [ 2423 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2423 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4144 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4144 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4145 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4145 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1531344584, 12451862, 3112960, 0, 0 ] } , "name": "/layers.24/mlp/gate_proj/Linear", "outputIndexes": [ 4146 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4146 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4147 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4147 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2424 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2424 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_24/Mul_output_0", "outputIndexes": [ 2425 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4145 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1546909406, 12451862, 3112960, 0, 0 ] } , "name": "/layers.24/mlp/up_proj/Linear", "outputIndexes": [ 4150 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4150 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4151 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4151 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2426 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2425, 2426 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_24/Mul_output_0", "outputIndexes": [ 2427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2427 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4152 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4152 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.24/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4153 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4153 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1562474228, 12451862, 3112960, 0, 0 ] } , "name": "/layers.24/mlp/down_proj/Linear", "outputIndexes": [ 4154 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4154 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4155 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4155 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.24/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2428 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2422, 2428 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_127_output_0", "outputIndexes": [ 2429 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2429, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_225_output_0", "outputIndexes": [ 2430 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2430 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1578039050, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_25/Mul_1_output_0", "outputIndexes": [ 2431 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2431 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4156 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4156 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4157 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4157 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1578059530, 5242902, 1310720, 0, 0 ] } , "name": "/layers.25/self_attn/q_proj/Linear", "outputIndexes": [ 4158 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4158 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4159 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4159 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2432 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2431 ] , "main_type": "NONE", "name": "/Shape_350_output_0", "outputIndexes": [ 2433 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2433 ] , "main_type": "NONE", "name": "Shape9940", "outputIndexes": [ 2434 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2433 ] , "main_type": "NONE", "name": "Rank9942", "outputIndexes": [ 2435 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2435, 2435 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9944", "outputIndexes": [ 2436 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2436 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9945", "outputIndexes": [ 2437 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2436, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9947", "outputIndexes": [ 2438 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2438 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9948", "outputIndexes": [ 2439 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2434, 2437, 2439, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9951", "outputIndexes": [ 2440 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2440 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9952", "outputIndexes": [ 2441 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2441, 2441 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9954", "outputIndexes": [ 2442 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2433, 2442, 2436 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_381_output_0", "outputIndexes": [ 2443 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2443, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_800_output_0", "outputIndexes": [ 2444 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2436 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9962", "outputIndexes": [ 2445 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2438 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9965", "outputIndexes": [ 2446 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2434, 2445, 2446, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9968", "outputIndexes": [ 2447 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2447 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9969", "outputIndexes": [ 2448 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2448 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9970", "outputIndexes": [ 2449 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2449, 2448 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9971", "outputIndexes": [ 2450 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2433, 2450, 2436 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_382_output_0", "outputIndexes": [ 2451 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2451, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_801_output_0", "outputIndexes": [ 2452 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2444, 2452, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_325_output_0", "outputIndexes": [ 2453 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2432, 2453 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_226_output_0", "outputIndexes": [ 2454 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2454 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1584613152, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_25/Mul_1_output_0", "outputIndexes": [ 2456 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2456, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_200_output_0", "outputIndexes": [ 2457 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2456 ] , "main_type": "NONE", "name": "/Shape_352_output_0", "outputIndexes": [ 2458 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2458 ] , "main_type": "NONE", "name": "Shape10090", "outputIndexes": [ 2459 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2458 ] , "main_type": "NONE", "name": "Rank10092", "outputIndexes": [ 2460 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2460, 2460 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10094", "outputIndexes": [ 2461 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2461 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10095", "outputIndexes": [ 2462 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2461, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10097", "outputIndexes": [ 2463 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2463 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10098", "outputIndexes": [ 2464 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2459, 2462, 2464, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10101", "outputIndexes": [ 2465 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2465 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10102", "outputIndexes": [ 2466 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2466 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10103", "outputIndexes": [ 2467 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2467, 2466 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10104", "outputIndexes": [ 2468 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2458, 2468, 2461 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_383_output_0", "outputIndexes": [ 2469 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2469, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_75_output_0", "outputIndexes": [ 2470 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2470, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_807_output_0", "outputIndexes": [ 2471 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2456, 2471, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_101_output_0", "outputIndexes": [ 2472 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2472 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_50_output_0", "outputIndexes": [ 2473 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2470, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_806_output_0", "outputIndexes": [ 2474 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2456, 22, 2474, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_100_output_0", "outputIndexes": [ 2475 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2473, 2475 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_328_output_0", "outputIndexes": [ 2476 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2476, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_201_output_0", "outputIndexes": [ 2477 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2457, 2477 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_128_output_0", "outputIndexes": [ 2478 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4157 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1584614176, 1310742, 327680, 0, 0 ] } , "name": "/layers.25/self_attn/k_proj/Linear", "outputIndexes": [ 4162 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4162 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4163 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4163 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2479 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2443, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_802_output_0", "outputIndexes": [ 2480 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2451, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_803_output_0", "outputIndexes": [ 2481 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2480, 2481, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_326_output_0", "outputIndexes": [ 2482 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2479, 2482 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_227_output_0", "outputIndexes": [ 2483 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2483 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1586252598, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_25/Mul_1_output_0", "outputIndexes": [ 2485 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2485, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_202_output_0", "outputIndexes": [ 2486 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2485 ] , "main_type": "NONE", "name": "/Shape_353_output_0", "outputIndexes": [ 2487 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2487 ] , "main_type": "NONE", "name": "Shape9986", "outputIndexes": [ 2488 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2487 ] , "main_type": "NONE", "name": "Rank9988", "outputIndexes": [ 2489 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2489, 2489 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9990", "outputIndexes": [ 2490 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2490 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9991", "outputIndexes": [ 2491 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2490, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9993", "outputIndexes": [ 2492 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2492 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze9994", "outputIndexes": [ 2493 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2488, 2491, 2493, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice9997", "outputIndexes": [ 2494 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2494 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze9998", "outputIndexes": [ 2495 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2495 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp9999", "outputIndexes": [ 2496 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2496, 2495 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10000", "outputIndexes": [ 2497 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2487, 2497, 2490 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_384_output_0", "outputIndexes": [ 2498 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2498, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_76_output_0", "outputIndexes": [ 2499 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2499, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_809_output_0", "outputIndexes": [ 2500 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2485, 2500, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_103_output_0", "outputIndexes": [ 2501 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2501 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_51_output_0", "outputIndexes": [ 2502 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2499, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_808_output_0", "outputIndexes": [ 2503 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2485, 22, 2503, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_102_output_0", "outputIndexes": [ 2504 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2502, 2504 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_329_output_0", "outputIndexes": [ 2505 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2505, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_203_output_0", "outputIndexes": [ 2506 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2486, 2506 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_129_output_0", "outputIndexes": [ 2507 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4157 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1586253622, 1310742, 327680, 0, 0 ] } , "name": "/layers.25/self_attn/v_proj/Linear", "outputIndexes": [ 4166 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4166 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4167 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4167 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2508 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2443, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_804_output_0", "outputIndexes": [ 2509 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2451, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_805_output_0", "outputIndexes": [ 2510 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2509, 2510, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_327_output_0", "outputIndexes": [ 2511 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2508, 2511 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_228_output_0", "outputIndexes": [ 2512 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2478, 2507, 2512, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_233_output_0", "outputIndexes": [ 2513 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2513 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4168 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4168 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4169 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4169 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1587892044, 5242902, 1310720, 0, 0 ] } , "name": "/layers.25/self_attn/o_proj/Linear", "outputIndexes": [ 4170 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4170 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4171 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4171 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.25/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2514 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2430, 2514 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_131_output_0", "outputIndexes": [ 2515 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2515 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1594445666, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_25/Mul_1_output_0", "outputIndexes": [ 2516 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2516 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4172 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4172 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4173 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4173 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1594466146, 12451862, 3112960, 0, 0 ] } , "name": "/layers.25/mlp/gate_proj/Linear", "outputIndexes": [ 4174 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4174 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4175 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4175 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2517 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2517 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_25/Mul_output_0", "outputIndexes": [ 2518 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4173 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1610030968, 12451862, 3112960, 0, 0 ] } , "name": "/layers.25/mlp/up_proj/Linear", "outputIndexes": [ 4178 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4178 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4179 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4179 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2519 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2518, 2519 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_25/Mul_output_0", "outputIndexes": [ 2520 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2520 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4180 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4180 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.25/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4181 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4181 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1625595790, 12451862, 3112960, 0, 0 ] } , "name": "/layers.25/mlp/down_proj/Linear", "outputIndexes": [ 4182 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4182 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4183 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4183 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.25/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2521 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2515, 2521 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_132_output_0", "outputIndexes": [ 2522 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2522, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_234_output_0", "outputIndexes": [ 2523 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2523 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1641160612, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_26/Mul_1_output_0", "outputIndexes": [ 2524 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2524 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4184 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4184 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4185 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4185 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1641181092, 5242902, 1310720, 0, 0 ] } , "name": "/layers.26/self_attn/q_proj/Linear", "outputIndexes": [ 4186 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4186 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4187 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4187 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2525 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2524 ] , "main_type": "NONE", "name": "/Shape_364_output_0", "outputIndexes": [ 2526 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2526 ] , "main_type": "NONE", "name": "Shape10329", "outputIndexes": [ 2527 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2526 ] , "main_type": "NONE", "name": "Rank10331", "outputIndexes": [ 2528 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2528, 2528 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10333", "outputIndexes": [ 2529 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2529 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10334", "outputIndexes": [ 2530 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2529, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10336", "outputIndexes": [ 2531 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2531 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10337", "outputIndexes": [ 2532 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2527, 2530, 2532, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10340", "outputIndexes": [ 2533 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2533 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10341", "outputIndexes": [ 2534 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2534, 2534 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10343", "outputIndexes": [ 2535 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2526, 2535, 2529 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_396_output_0", "outputIndexes": [ 2536 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2536, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_832_output_0", "outputIndexes": [ 2537 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2529 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10351", "outputIndexes": [ 2538 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2531 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10354", "outputIndexes": [ 2539 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2527, 2538, 2539, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10357", "outputIndexes": [ 2540 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2540 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10358", "outputIndexes": [ 2541 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2541 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10359", "outputIndexes": [ 2542 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2542, 2541 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10360", "outputIndexes": [ 2543 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2526, 2543, 2529 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_397_output_0", "outputIndexes": [ 2544 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2544, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_833_output_0", "outputIndexes": [ 2545 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2537, 2545, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_338_output_0", "outputIndexes": [ 2546 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2525, 2546 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_235_output_0", "outputIndexes": [ 2547 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2547 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1647734714, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_26/Mul_1_output_0", "outputIndexes": [ 2549 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2549, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_208_output_0", "outputIndexes": [ 2550 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2549 ] , "main_type": "NONE", "name": "/Shape_366_output_0", "outputIndexes": [ 2551 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2551 ] , "main_type": "NONE", "name": "Shape10479", "outputIndexes": [ 2552 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2551 ] , "main_type": "NONE", "name": "Rank10481", "outputIndexes": [ 2553 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2553, 2553 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10483", "outputIndexes": [ 2554 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2554 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10484", "outputIndexes": [ 2555 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2554, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10486", "outputIndexes": [ 2556 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2556 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10487", "outputIndexes": [ 2557 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2552, 2555, 2557, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10490", "outputIndexes": [ 2558 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2558 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10491", "outputIndexes": [ 2559 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2559 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10492", "outputIndexes": [ 2560 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2560, 2559 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10493", "outputIndexes": [ 2561 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2551, 2561, 2554 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_398_output_0", "outputIndexes": [ 2562 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2562, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_78_output_0", "outputIndexes": [ 2563 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2563, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_839_output_0", "outputIndexes": [ 2564 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2549, 2564, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_105_output_0", "outputIndexes": [ 2565 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2565 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_52_output_0", "outputIndexes": [ 2566 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2563, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_838_output_0", "outputIndexes": [ 2567 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2549, 22, 2567, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_104_output_0", "outputIndexes": [ 2568 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2566, 2568 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_341_output_0", "outputIndexes": [ 2569 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2569, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_209_output_0", "outputIndexes": [ 2570 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2550, 2570 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_133_output_0", "outputIndexes": [ 2571 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4185 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1647735738, 1310742, 327680, 0, 0 ] } , "name": "/layers.26/self_attn/k_proj/Linear", "outputIndexes": [ 4190 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4190 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4191 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4191 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2572 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2536, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_834_output_0", "outputIndexes": [ 2573 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2544, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_835_output_0", "outputIndexes": [ 2574 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2573, 2574, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_339_output_0", "outputIndexes": [ 2575 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2572, 2575 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_236_output_0", "outputIndexes": [ 2576 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2576 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1649374160, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_26/Mul_1_output_0", "outputIndexes": [ 2578 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_210_output_0", "outputIndexes": [ 2579 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578 ] , "main_type": "NONE", "name": "/Shape_367_output_0", "outputIndexes": [ 2580 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2580 ] , "main_type": "NONE", "name": "Shape10375", "outputIndexes": [ 2581 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2580 ] , "main_type": "NONE", "name": "Rank10377", "outputIndexes": [ 2582 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2582, 2582 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10379", "outputIndexes": [ 2583 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2583 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10380", "outputIndexes": [ 2584 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2583, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10382", "outputIndexes": [ 2585 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2585 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10383", "outputIndexes": [ 2586 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2581, 2584, 2586, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10386", "outputIndexes": [ 2587 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2587 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10387", "outputIndexes": [ 2588 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2588 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10388", "outputIndexes": [ 2589 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2589, 2588 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10389", "outputIndexes": [ 2590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2580, 2590, 2583 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_399_output_0", "outputIndexes": [ 2591 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2591, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_79_output_0", "outputIndexes": [ 2592 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2592, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_841_output_0", "outputIndexes": [ 2593 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578, 2593, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_107_output_0", "outputIndexes": [ 2594 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2594 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_53_output_0", "outputIndexes": [ 2595 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2592, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_840_output_0", "outputIndexes": [ 2596 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578, 22, 2596, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_106_output_0", "outputIndexes": [ 2597 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2595, 2597 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_342_output_0", "outputIndexes": [ 2598 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2598, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_211_output_0", "outputIndexes": [ 2599 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2579, 2599 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_134_output_0", "outputIndexes": [ 2600 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4185 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1649375184, 1310742, 327680, 0, 0 ] } , "name": "/layers.26/self_attn/v_proj/Linear", "outputIndexes": [ 4194 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4194 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4195 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4195 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2601 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2536, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_836_output_0", "outputIndexes": [ 2602 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2544, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_837_output_0", "outputIndexes": [ 2603 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2602, 2603, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_340_output_0", "outputIndexes": [ 2604 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2601, 2604 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_237_output_0", "outputIndexes": [ 2605 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2571, 2600, 2605, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_242_output_0", "outputIndexes": [ 2606 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2606 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4196 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4196 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4197 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4197 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1651013606, 5242902, 1310720, 0, 0 ] } , "name": "/layers.26/self_attn/o_proj/Linear", "outputIndexes": [ 4198 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4198 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4199 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4199 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.26/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2607 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2523, 2607 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_136_output_0", "outputIndexes": [ 2608 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2608 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1657567228, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_26/Mul_1_output_0", "outputIndexes": [ 2609 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2609 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4200 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4200 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4201 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4201 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1657587708, 12451862, 3112960, 0, 0 ] } , "name": "/layers.26/mlp/gate_proj/Linear", "outputIndexes": [ 4202 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4202 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4203 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4203 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2610 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2610 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_26/Mul_output_0", "outputIndexes": [ 2611 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4201 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1673152530, 12451862, 3112960, 0, 0 ] } , "name": "/layers.26/mlp/up_proj/Linear", "outputIndexes": [ 4206 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4206 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4207 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4207 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2612 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2611, 2612 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_26/Mul_output_0", "outputIndexes": [ 2613 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2613 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4208 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4208 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.26/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4209 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4209 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1688717352, 12451862, 3112960, 0, 0 ] } , "name": "/layers.26/mlp/down_proj/Linear", "outputIndexes": [ 4210 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4210 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4211 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4211 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.26/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2614 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2608, 2614 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_137_output_0", "outputIndexes": [ 2615 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2615, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_243_output_0", "outputIndexes": [ 2616 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2616 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1704282174, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_27/Mul_1_output_0", "outputIndexes": [ 2617 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2617 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4212 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4212 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4213 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4213 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1704302654, 5242902, 1310720, 0, 0 ] } , "name": "/layers.27/self_attn/q_proj/Linear", "outputIndexes": [ 4214 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4214 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4215 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4215 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2618 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2617 ] , "main_type": "NONE", "name": "/Shape_378_output_0", "outputIndexes": [ 2619 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2619 ] , "main_type": "NONE", "name": "Shape10718", "outputIndexes": [ 2620 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2619 ] , "main_type": "NONE", "name": "Rank10720", "outputIndexes": [ 2621 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2621, 2621 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10722", "outputIndexes": [ 2622 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2622 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10723", "outputIndexes": [ 2623 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2622, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10725", "outputIndexes": [ 2624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2624 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10726", "outputIndexes": [ 2625 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2620, 2623, 2625, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10729", "outputIndexes": [ 2626 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2626 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10730", "outputIndexes": [ 2627 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2627, 2627 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10732", "outputIndexes": [ 2628 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2619, 2628, 2622 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_411_output_0", "outputIndexes": [ 2629 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2629, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_864_output_0", "outputIndexes": [ 2630 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2622 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10740", "outputIndexes": [ 2631 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2624 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10743", "outputIndexes": [ 2632 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2620, 2631, 2632, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10746", "outputIndexes": [ 2633 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2633 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10747", "outputIndexes": [ 2634 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2634 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10748", "outputIndexes": [ 2635 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2635, 2634 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10749", "outputIndexes": [ 2636 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2619, 2636, 2622 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_412_output_0", "outputIndexes": [ 2637 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2637, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_865_output_0", "outputIndexes": [ 2638 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2630, 2638, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_351_output_0", "outputIndexes": [ 2639 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2618, 2639 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_244_output_0", "outputIndexes": [ 2640 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2640 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1710856276, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_27/Mul_1_output_0", "outputIndexes": [ 2642 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2642, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_216_output_0", "outputIndexes": [ 2643 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2642 ] , "main_type": "NONE", "name": "/Shape_380_output_0", "outputIndexes": [ 2644 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2644 ] , "main_type": "NONE", "name": "Shape10868", "outputIndexes": [ 2645 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2644 ] , "main_type": "NONE", "name": "Rank10870", "outputIndexes": [ 2646 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2646, 2646 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10872", "outputIndexes": [ 2647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2647 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10873", "outputIndexes": [ 2648 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2647, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10875", "outputIndexes": [ 2649 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2649 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10876", "outputIndexes": [ 2650 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2645, 2648, 2650, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10879", "outputIndexes": [ 2651 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2651 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10880", "outputIndexes": [ 2652 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2652 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10881", "outputIndexes": [ 2653 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2653, 2652 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10882", "outputIndexes": [ 2654 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2644, 2654, 2647 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_413_output_0", "outputIndexes": [ 2655 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2655, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_81_output_0", "outputIndexes": [ 2656 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2656, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_871_output_0", "outputIndexes": [ 2657 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2642, 2657, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_109_output_0", "outputIndexes": [ 2658 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2658 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_54_output_0", "outputIndexes": [ 2659 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2656, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_870_output_0", "outputIndexes": [ 2660 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2642, 22, 2660, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_108_output_0", "outputIndexes": [ 2661 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2659, 2661 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_354_output_0", "outputIndexes": [ 2662 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2662, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_217_output_0", "outputIndexes": [ 2663 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2643, 2663 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_138_output_0", "outputIndexes": [ 2664 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4213 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1710857300, 1310742, 327680, 0, 0 ] } , "name": "/layers.27/self_attn/k_proj/Linear", "outputIndexes": [ 4218 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4218 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4219 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4219 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2665 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2629, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_866_output_0", "outputIndexes": [ 2666 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2637, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_867_output_0", "outputIndexes": [ 2667 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2666, 2667, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_352_output_0", "outputIndexes": [ 2668 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2665, 2668 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_245_output_0", "outputIndexes": [ 2669 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2669 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1712495722, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_27/Mul_1_output_0", "outputIndexes": [ 2671 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2671, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_218_output_0", "outputIndexes": [ 2672 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2671 ] , "main_type": "NONE", "name": "/Shape_381_output_0", "outputIndexes": [ 2673 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2673 ] , "main_type": "NONE", "name": "Shape10764", "outputIndexes": [ 2674 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2673 ] , "main_type": "NONE", "name": "Rank10766", "outputIndexes": [ 2675 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2675, 2675 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10768", "outputIndexes": [ 2676 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2676 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10769", "outputIndexes": [ 2677 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2676, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10771", "outputIndexes": [ 2678 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2678 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze10772", "outputIndexes": [ 2679 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2674, 2677, 2679, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice10775", "outputIndexes": [ 2680 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2680 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze10776", "outputIndexes": [ 2681 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2681 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10777", "outputIndexes": [ 2682 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2682, 2681 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp10778", "outputIndexes": [ 2683 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2673, 2683, 2676 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_414_output_0", "outputIndexes": [ 2684 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2684, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_82_output_0", "outputIndexes": [ 2685 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2685, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_873_output_0", "outputIndexes": [ 2686 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2671, 2686, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_111_output_0", "outputIndexes": [ 2687 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2687 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_55_output_0", "outputIndexes": [ 2688 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2685, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_872_output_0", "outputIndexes": [ 2689 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2671, 22, 2689, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_110_output_0", "outputIndexes": [ 2690 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2688, 2690 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_355_output_0", "outputIndexes": [ 2691 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2691, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_219_output_0", "outputIndexes": [ 2692 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2672, 2692 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_139_output_0", "outputIndexes": [ 2693 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4213 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1712496746, 1310742, 327680, 0, 0 ] } , "name": "/layers.27/self_attn/v_proj/Linear", "outputIndexes": [ 4222 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4222 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4223 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4223 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2694 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2629, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_868_output_0", "outputIndexes": [ 2695 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2637, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_869_output_0", "outputIndexes": [ 2696 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2695, 2696, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_353_output_0", "outputIndexes": [ 2697 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2694, 2697 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_246_output_0", "outputIndexes": [ 2698 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2664, 2693, 2698, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_251_output_0", "outputIndexes": [ 2699 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2699 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4224 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4224 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4225 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4225 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1714135168, 5242902, 1310720, 0, 0 ] } , "name": "/layers.27/self_attn/o_proj/Linear", "outputIndexes": [ 4226 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4226 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4227 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4227 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.27/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2700 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2616, 2700 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_141_output_0", "outputIndexes": [ 2701 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2701 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1720688790, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_27/Mul_1_output_0", "outputIndexes": [ 2702 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2702 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4228 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4228 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4229 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4229 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1720709270, 12451862, 3112960, 0, 0 ] } , "name": "/layers.27/mlp/gate_proj/Linear", "outputIndexes": [ 4230 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4230 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4231 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4231 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2703 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2703 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_27/Mul_output_0", "outputIndexes": [ 2704 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4229 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1736274092, 12451862, 3112960, 0, 0 ] } , "name": "/layers.27/mlp/up_proj/Linear", "outputIndexes": [ 4234 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4234 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4235 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4235 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2705 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2704, 2705 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_27/Mul_output_0", "outputIndexes": [ 2706 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2706 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4236 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4236 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.27/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4237 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4237 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1751838914, 12451862, 3112960, 0, 0 ] } , "name": "/layers.27/mlp/down_proj/Linear", "outputIndexes": [ 4238 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4238 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4239 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4239 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.27/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2707 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2701, 2707 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_142_output_0", "outputIndexes": [ 2708 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2708, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_252_output_0", "outputIndexes": [ 2709 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2709 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1767403736, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_28/Mul_1_output_0", "outputIndexes": [ 2710 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2710 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4240 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4240 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4241 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4241 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1767424216, 5242902, 1310720, 0, 0 ] } , "name": "/layers.28/self_attn/q_proj/Linear", "outputIndexes": [ 4242 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4242 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4243 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4243 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2711 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2710 ] , "main_type": "NONE", "name": "/Shape_392_output_0", "outputIndexes": [ 2712 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2712 ] , "main_type": "NONE", "name": "Shape11107", "outputIndexes": [ 2713 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2712 ] , "main_type": "NONE", "name": "Rank11109", "outputIndexes": [ 2714 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2714, 2714 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11111", "outputIndexes": [ 2715 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2715 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11112", "outputIndexes": [ 2716 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2715, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11114", "outputIndexes": [ 2717 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2717 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11115", "outputIndexes": [ 2718 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2713, 2716, 2718, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11118", "outputIndexes": [ 2719 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2719 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11119", "outputIndexes": [ 2720 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2720, 2720 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11121", "outputIndexes": [ 2721 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2712, 2721, 2715 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_426_output_0", "outputIndexes": [ 2722 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2722, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_896_output_0", "outputIndexes": [ 2723 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2715 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11129", "outputIndexes": [ 2724 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2717 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11132", "outputIndexes": [ 2725 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2713, 2724, 2725, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11135", "outputIndexes": [ 2726 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2726 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11136", "outputIndexes": [ 2727 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2727 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11137", "outputIndexes": [ 2728 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2728, 2727 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11138", "outputIndexes": [ 2729 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2712, 2729, 2715 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_427_output_0", "outputIndexes": [ 2730 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2730, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_897_output_0", "outputIndexes": [ 2731 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2723, 2731, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_364_output_0", "outputIndexes": [ 2732 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2711, 2732 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_253_output_0", "outputIndexes": [ 2733 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2733 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1773977838, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_28/Mul_1_output_0", "outputIndexes": [ 2735 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2735, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_224_output_0", "outputIndexes": [ 2736 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2735 ] , "main_type": "NONE", "name": "/Shape_394_output_0", "outputIndexes": [ 2737 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2737 ] , "main_type": "NONE", "name": "Shape11257", "outputIndexes": [ 2738 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2737 ] , "main_type": "NONE", "name": "Rank11259", "outputIndexes": [ 2739 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2739, 2739 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11261", "outputIndexes": [ 2740 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2740 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11262", "outputIndexes": [ 2741 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2740, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11264", "outputIndexes": [ 2742 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2742 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11265", "outputIndexes": [ 2743 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2738, 2741, 2743, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11268", "outputIndexes": [ 2744 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2744 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11269", "outputIndexes": [ 2745 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2745 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11270", "outputIndexes": [ 2746 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2746, 2745 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11271", "outputIndexes": [ 2747 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2737, 2747, 2740 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_428_output_0", "outputIndexes": [ 2748 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2748, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_84_output_0", "outputIndexes": [ 2749 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2749, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_903_output_0", "outputIndexes": [ 2750 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2735, 2750, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_113_output_0", "outputIndexes": [ 2751 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2751 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_56_output_0", "outputIndexes": [ 2752 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2749, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_902_output_0", "outputIndexes": [ 2753 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2735, 22, 2753, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_112_output_0", "outputIndexes": [ 2754 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2752, 2754 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_367_output_0", "outputIndexes": [ 2755 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2755, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_225_output_0", "outputIndexes": [ 2756 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2736, 2756 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_143_output_0", "outputIndexes": [ 2757 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4241 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1773978862, 1310742, 327680, 0, 0 ] } , "name": "/layers.28/self_attn/k_proj/Linear", "outputIndexes": [ 4246 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4246 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4247 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4247 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2758 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2722, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_898_output_0", "outputIndexes": [ 2759 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2730, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_899_output_0", "outputIndexes": [ 2760 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2759, 2760, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_365_output_0", "outputIndexes": [ 2761 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2758, 2761 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_254_output_0", "outputIndexes": [ 2762 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2762 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1775617284, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_28/Mul_1_output_0", "outputIndexes": [ 2764 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2764, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_226_output_0", "outputIndexes": [ 2765 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2764 ] , "main_type": "NONE", "name": "/Shape_395_output_0", "outputIndexes": [ 2766 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2766 ] , "main_type": "NONE", "name": "Shape11153", "outputIndexes": [ 2767 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2766 ] , "main_type": "NONE", "name": "Rank11155", "outputIndexes": [ 2768 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2768, 2768 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11157", "outputIndexes": [ 2769 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2769 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11158", "outputIndexes": [ 2770 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2769, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11160", "outputIndexes": [ 2771 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2771 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11161", "outputIndexes": [ 2772 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2767, 2770, 2772, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11164", "outputIndexes": [ 2773 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2773 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11165", "outputIndexes": [ 2774 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2774 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11166", "outputIndexes": [ 2775 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2775, 2774 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11167", "outputIndexes": [ 2776 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2766, 2776, 2769 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_429_output_0", "outputIndexes": [ 2777 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2777, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_85_output_0", "outputIndexes": [ 2778 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2778, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_905_output_0", "outputIndexes": [ 2779 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2764, 2779, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_115_output_0", "outputIndexes": [ 2780 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2780 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_57_output_0", "outputIndexes": [ 2781 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2778, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_904_output_0", "outputIndexes": [ 2782 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2764, 22, 2782, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_114_output_0", "outputIndexes": [ 2783 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2781, 2783 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_368_output_0", "outputIndexes": [ 2784 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2784, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_227_output_0", "outputIndexes": [ 2785 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2765, 2785 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_144_output_0", "outputIndexes": [ 2786 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4241 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1775618308, 1310742, 327680, 0, 0 ] } , "name": "/layers.28/self_attn/v_proj/Linear", "outputIndexes": [ 4250 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4250 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4251 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4251 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2787 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2722, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_900_output_0", "outputIndexes": [ 2788 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2730, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_901_output_0", "outputIndexes": [ 2789 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2788, 2789, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_366_output_0", "outputIndexes": [ 2790 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2787, 2790 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_255_output_0", "outputIndexes": [ 2791 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2757, 2786, 2791, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_260_output_0", "outputIndexes": [ 2792 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2792 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4252 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4252 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4253 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4253 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1777256730, 5242902, 1310720, 0, 0 ] } , "name": "/layers.28/self_attn/o_proj/Linear", "outputIndexes": [ 4254 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4254 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4255 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4255 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.28/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2793 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2709, 2793 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_146_output_0", "outputIndexes": [ 2794 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2794 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1783810352, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_28/Mul_1_output_0", "outputIndexes": [ 2795 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2795 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4256 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4256 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4257 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4257 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1783830832, 12451862, 3112960, 0, 0 ] } , "name": "/layers.28/mlp/gate_proj/Linear", "outputIndexes": [ 4258 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4258 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4259 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4259 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2796 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2796 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_28/Mul_output_0", "outputIndexes": [ 2797 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4257 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1799395654, 12451862, 3112960, 0, 0 ] } , "name": "/layers.28/mlp/up_proj/Linear", "outputIndexes": [ 4262 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4262 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4263 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4263 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2798 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2797, 2798 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_28/Mul_output_0", "outputIndexes": [ 2799 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2799 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4264 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4264 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.28/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4265 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4265 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1814960476, 12451862, 3112960, 0, 0 ] } , "name": "/layers.28/mlp/down_proj/Linear", "outputIndexes": [ 4266 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4266 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4267 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4267 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.28/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2800 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2794, 2800 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_147_output_0", "outputIndexes": [ 2801 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2801, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_261_output_0", "outputIndexes": [ 2802 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2802 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1830525298, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_29/Mul_1_output_0", "outputIndexes": [ 2803 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2803 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4268 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4268 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4269 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4269 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1830545778, 5242902, 1310720, 0, 0 ] } , "name": "/layers.29/self_attn/q_proj/Linear", "outputIndexes": [ 4270 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4270 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4271 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4271 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2804 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2803 ] , "main_type": "NONE", "name": "/Shape_406_output_0", "outputIndexes": [ 2805 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2805 ] , "main_type": "NONE", "name": "Shape11496", "outputIndexes": [ 2806 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2805 ] , "main_type": "NONE", "name": "Rank11498", "outputIndexes": [ 2807 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2807, 2807 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11500", "outputIndexes": [ 2808 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2808 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11501", "outputIndexes": [ 2809 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2808, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11503", "outputIndexes": [ 2810 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2810 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11504", "outputIndexes": [ 2811 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2806, 2809, 2811, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11507", "outputIndexes": [ 2812 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2812 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11508", "outputIndexes": [ 2813 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2813, 2813 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11510", "outputIndexes": [ 2814 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2805, 2814, 2808 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_441_output_0", "outputIndexes": [ 2815 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2815, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_928_output_0", "outputIndexes": [ 2816 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2808 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11518", "outputIndexes": [ 2817 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2810 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11521", "outputIndexes": [ 2818 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2806, 2817, 2818, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11524", "outputIndexes": [ 2819 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2819 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11525", "outputIndexes": [ 2820 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2820 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11526", "outputIndexes": [ 2821 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2821, 2820 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11527", "outputIndexes": [ 2822 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2805, 2822, 2808 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_442_output_0", "outputIndexes": [ 2823 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2823, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_929_output_0", "outputIndexes": [ 2824 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2816, 2824, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_377_output_0", "outputIndexes": [ 2825 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2804, 2825 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_262_output_0", "outputIndexes": [ 2826 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2826 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1837099400, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_29/Mul_1_output_0", "outputIndexes": [ 2828 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2828, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_232_output_0", "outputIndexes": [ 2829 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2828 ] , "main_type": "NONE", "name": "/Shape_408_output_0", "outputIndexes": [ 2830 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2830 ] , "main_type": "NONE", "name": "Shape11646", "outputIndexes": [ 2831 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2830 ] , "main_type": "NONE", "name": "Rank11648", "outputIndexes": [ 2832 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2832, 2832 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11650", "outputIndexes": [ 2833 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2833 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11651", "outputIndexes": [ 2834 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2833, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11653", "outputIndexes": [ 2835 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2835 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11654", "outputIndexes": [ 2836 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2831, 2834, 2836, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11657", "outputIndexes": [ 2837 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2837 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11658", "outputIndexes": [ 2838 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2838 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11659", "outputIndexes": [ 2839 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2839, 2838 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11660", "outputIndexes": [ 2840 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2830, 2840, 2833 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_443_output_0", "outputIndexes": [ 2841 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2841, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_87_output_0", "outputIndexes": [ 2842 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2842, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_935_output_0", "outputIndexes": [ 2843 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2828, 2843, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_117_output_0", "outputIndexes": [ 2844 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2844 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_58_output_0", "outputIndexes": [ 2845 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2842, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_934_output_0", "outputIndexes": [ 2846 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2828, 22, 2846, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_116_output_0", "outputIndexes": [ 2847 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2845, 2847 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_380_output_0", "outputIndexes": [ 2848 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2848, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_233_output_0", "outputIndexes": [ 2849 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2829, 2849 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_148_output_0", "outputIndexes": [ 2850 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4269 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1837100424, 1310742, 327680, 0, 0 ] } , "name": "/layers.29/self_attn/k_proj/Linear", "outputIndexes": [ 4274 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4274 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4275 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4275 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2851 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2815, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_930_output_0", "outputIndexes": [ 2852 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2823, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_931_output_0", "outputIndexes": [ 2853 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2852, 2853, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_378_output_0", "outputIndexes": [ 2854 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2851, 2854 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_263_output_0", "outputIndexes": [ 2855 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2855 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1838738846, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_29/Mul_1_output_0", "outputIndexes": [ 2857 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2857, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_234_output_0", "outputIndexes": [ 2858 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2857 ] , "main_type": "NONE", "name": "/Shape_409_output_0", "outputIndexes": [ 2859 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2859 ] , "main_type": "NONE", "name": "Shape11542", "outputIndexes": [ 2860 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2859 ] , "main_type": "NONE", "name": "Rank11544", "outputIndexes": [ 2861 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2861, 2861 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11546", "outputIndexes": [ 2862 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2862 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11547", "outputIndexes": [ 2863 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2862, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11549", "outputIndexes": [ 2864 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2864 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11550", "outputIndexes": [ 2865 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2860, 2863, 2865, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11553", "outputIndexes": [ 2866 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2866 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11554", "outputIndexes": [ 2867 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2867 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11555", "outputIndexes": [ 2868 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2868, 2867 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11556", "outputIndexes": [ 2869 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2859, 2869, 2862 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_444_output_0", "outputIndexes": [ 2870 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2870, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_88_output_0", "outputIndexes": [ 2871 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2871, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_937_output_0", "outputIndexes": [ 2872 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2857, 2872, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_119_output_0", "outputIndexes": [ 2873 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2873 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_59_output_0", "outputIndexes": [ 2874 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2871, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_936_output_0", "outputIndexes": [ 2875 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2857, 22, 2875, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_118_output_0", "outputIndexes": [ 2876 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2874, 2876 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_381_output_0", "outputIndexes": [ 2877 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2877, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_235_output_0", "outputIndexes": [ 2878 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2858, 2878 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_149_output_0", "outputIndexes": [ 2879 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4269 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1838739870, 1310742, 327680, 0, 0 ] } , "name": "/layers.29/self_attn/v_proj/Linear", "outputIndexes": [ 4278 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4278 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4279 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4279 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2880 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2815, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_932_output_0", "outputIndexes": [ 2881 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2823, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_933_output_0", "outputIndexes": [ 2882 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2881, 2882, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_379_output_0", "outputIndexes": [ 2883 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2880, 2883 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_264_output_0", "outputIndexes": [ 2884 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2850, 2879, 2884, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_269_output_0", "outputIndexes": [ 2885 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2885 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4280 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4280 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4281 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4281 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1840378292, 5242902, 1310720, 0, 0 ] } , "name": "/layers.29/self_attn/o_proj/Linear", "outputIndexes": [ 4282 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4282 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4283 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4283 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.29/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2886 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2802, 2886 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_151_output_0", "outputIndexes": [ 2887 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2887 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1846931914, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_29/Mul_1_output_0", "outputIndexes": [ 2888 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2888 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4284 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4284 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4285 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4285 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1846952394, 12451862, 3112960, 0, 0 ] } , "name": "/layers.29/mlp/gate_proj/Linear", "outputIndexes": [ 4286 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4286 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4287 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4287 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2889 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2889 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_29/Mul_output_0", "outputIndexes": [ 2890 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4285 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1862517216, 12451862, 3112960, 0, 0 ] } , "name": "/layers.29/mlp/up_proj/Linear", "outputIndexes": [ 4290 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4290 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4291 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4291 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2891 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2890, 2891 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_29/Mul_output_0", "outputIndexes": [ 2892 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2892 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4292 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4292 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.29/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4293 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4293 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1878082038, 12451862, 3112960, 0, 0 ] } , "name": "/layers.29/mlp/down_proj/Linear", "outputIndexes": [ 4294 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4294 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4295 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4295 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.29/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2893 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2887, 2893 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_152_output_0", "outputIndexes": [ 2894 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2894, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_270_output_0", "outputIndexes": [ 2895 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2895 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1893646860, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_30/Mul_1_output_0", "outputIndexes": [ 2896 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2896 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4296 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4296 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4297 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4297 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1893667340, 5242902, 1310720, 0, 0 ] } , "name": "/layers.30/self_attn/q_proj/Linear", "outputIndexes": [ 4298 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4298 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4299 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4299 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2897 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2896 ] , "main_type": "NONE", "name": "/Shape_420_output_0", "outputIndexes": [ 2898 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2898 ] , "main_type": "NONE", "name": "Shape11885", "outputIndexes": [ 2899 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2898 ] , "main_type": "NONE", "name": "Rank11887", "outputIndexes": [ 2900 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2900, 2900 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11889", "outputIndexes": [ 2901 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2901 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11890", "outputIndexes": [ 2902 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2901, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11892", "outputIndexes": [ 2903 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2903 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11893", "outputIndexes": [ 2904 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2899, 2902, 2904, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11896", "outputIndexes": [ 2905 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2905 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11897", "outputIndexes": [ 2906 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2906, 2906 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11899", "outputIndexes": [ 2907 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2898, 2907, 2901 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_456_output_0", "outputIndexes": [ 2908 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2908, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_960_output_0", "outputIndexes": [ 2909 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2901 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11907", "outputIndexes": [ 2910 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2903 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11910", "outputIndexes": [ 2911 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2899, 2910, 2911, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11913", "outputIndexes": [ 2912 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2912 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11914", "outputIndexes": [ 2913 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 2913 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11915", "outputIndexes": [ 2914 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2914, 2913 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11916", "outputIndexes": [ 2915 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2898, 2915, 2901 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_457_output_0", "outputIndexes": [ 2916 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2916, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_961_output_0", "outputIndexes": [ 2917 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2909, 2917, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_390_output_0", "outputIndexes": [ 2918 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2897, 2918 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_271_output_0", "outputIndexes": [ 2919 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2919 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1900220962, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_30/Mul_1_output_0", "outputIndexes": [ 2921 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2921, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_240_output_0", "outputIndexes": [ 2922 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2921 ] , "main_type": "NONE", "name": "/Shape_422_output_0", "outputIndexes": [ 2923 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2923 ] , "main_type": "NONE", "name": "Shape12035", "outputIndexes": [ 2924 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2923 ] , "main_type": "NONE", "name": "Rank12037", "outputIndexes": [ 2925 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2925, 2925 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12039", "outputIndexes": [ 2926 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2926 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12040", "outputIndexes": [ 2927 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2926, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12042", "outputIndexes": [ 2928 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2928 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12043", "outputIndexes": [ 2929 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2924, 2927, 2929, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12046", "outputIndexes": [ 2930 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2930 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12047", "outputIndexes": [ 2931 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2931 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12048", "outputIndexes": [ 2932 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2932, 2931 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12049", "outputIndexes": [ 2933 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2923, 2933, 2926 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_458_output_0", "outputIndexes": [ 2934 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2934, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_90_output_0", "outputIndexes": [ 2935 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2935, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_967_output_0", "outputIndexes": [ 2936 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2921, 2936, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_121_output_0", "outputIndexes": [ 2937 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2937 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_60_output_0", "outputIndexes": [ 2938 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2935, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_966_output_0", "outputIndexes": [ 2939 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2921, 22, 2939, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_120_output_0", "outputIndexes": [ 2940 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2938, 2940 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_393_output_0", "outputIndexes": [ 2941 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2941, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_241_output_0", "outputIndexes": [ 2942 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2922, 2942 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_153_output_0", "outputIndexes": [ 2943 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4297 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1900221986, 1310742, 327680, 0, 0 ] } , "name": "/layers.30/self_attn/k_proj/Linear", "outputIndexes": [ 4302 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4302 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4303 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4303 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2944 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2908, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_962_output_0", "outputIndexes": [ 2945 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2916, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_963_output_0", "outputIndexes": [ 2946 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2945, 2946, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_391_output_0", "outputIndexes": [ 2947 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2944, 2947 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_272_output_0", "outputIndexes": [ 2948 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2948 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1901860408, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_30/Mul_1_output_0", "outputIndexes": [ 2950 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2950, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_242_output_0", "outputIndexes": [ 2951 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2950 ] , "main_type": "NONE", "name": "/Shape_423_output_0", "outputIndexes": [ 2952 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2952 ] , "main_type": "NONE", "name": "Shape11931", "outputIndexes": [ 2953 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2952 ] , "main_type": "NONE", "name": "Rank11933", "outputIndexes": [ 2954 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2954, 2954 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11935", "outputIndexes": [ 2955 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2955 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11936", "outputIndexes": [ 2956 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2955, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11938", "outputIndexes": [ 2957 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2957 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze11939", "outputIndexes": [ 2958 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2953, 2956, 2958, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice11942", "outputIndexes": [ 2959 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2959 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze11943", "outputIndexes": [ 2960 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 2960 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11944", "outputIndexes": [ 2961 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2961, 2960 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp11945", "outputIndexes": [ 2962 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2952, 2962, 2955 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_459_output_0", "outputIndexes": [ 2963 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2963, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_91_output_0", "outputIndexes": [ 2964 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2964, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_969_output_0", "outputIndexes": [ 2965 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2950, 2965, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_123_output_0", "outputIndexes": [ 2966 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2966 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_61_output_0", "outputIndexes": [ 2967 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2964, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_968_output_0", "outputIndexes": [ 2968 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2950, 22, 2968, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_122_output_0", "outputIndexes": [ 2969 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2967, 2969 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_394_output_0", "outputIndexes": [ 2970 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2970, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_243_output_0", "outputIndexes": [ 2971 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2951, 2971 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_154_output_0", "outputIndexes": [ 2972 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4297 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1901861432, 1310742, 327680, 0, 0 ] } , "name": "/layers.30/self_attn/v_proj/Linear", "outputIndexes": [ 4306 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4306 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4307 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4307 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2973 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2908, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_964_output_0", "outputIndexes": [ 2974 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2916, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_965_output_0", "outputIndexes": [ 2975 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2974, 2975, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_392_output_0", "outputIndexes": [ 2976 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2973, 2976 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_273_output_0", "outputIndexes": [ 2977 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2943, 2972, 2977, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_278_output_0", "outputIndexes": [ 2978 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2978 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4308 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4308 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4309 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4309 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1903499854, 5242902, 1310720, 0, 0 ] } , "name": "/layers.30/self_attn/o_proj/Linear", "outputIndexes": [ 4310 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4310 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4311 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4311 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.30/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2979 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2895, 2979 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_156_output_0", "outputIndexes": [ 2980 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2980 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1910053476, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_30/Mul_1_output_0", "outputIndexes": [ 2981 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2981 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4312 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4312 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4313 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4313 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1910073956, 12451862, 3112960, 0, 0 ] } , "name": "/layers.30/mlp/gate_proj/Linear", "outputIndexes": [ 4314 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4314 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4315 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4315 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2982 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2982 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_30/Mul_output_0", "outputIndexes": [ 2983 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4313 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1925638778, 12451862, 3112960, 0, 0 ] } , "name": "/layers.30/mlp/up_proj/Linear", "outputIndexes": [ 4318 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4318 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4319 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4319 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2984 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2983, 2984 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_30/Mul_output_0", "outputIndexes": [ 2985 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2985 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4320 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4320 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.30/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4321 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4321 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1941203600, 12451862, 3112960, 0, 0 ] } , "name": "/layers.30/mlp/down_proj/Linear", "outputIndexes": [ 4322 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4322 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4323 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4323 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.30/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2986 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2980, 2986 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_157_output_0", "outputIndexes": [ 2987 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2987, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_279_output_0", "outputIndexes": [ 2988 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2988 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1956768422, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_31/Mul_1_output_0", "outputIndexes": [ 2989 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2989 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4324 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4324 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4325 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4325 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1956788902, 5242902, 1310720, 0, 0 ] } , "name": "/layers.31/self_attn/q_proj/Linear", "outputIndexes": [ 4326 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4326 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4327 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4327 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2990 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2989 ] , "main_type": "NONE", "name": "/Shape_434_output_0", "outputIndexes": [ 2991 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2991 ] , "main_type": "NONE", "name": "Shape12274", "outputIndexes": [ 2992 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2991 ] , "main_type": "NONE", "name": "Rank12276", "outputIndexes": [ 2993 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2993, 2993 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12278", "outputIndexes": [ 2994 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2994 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12279", "outputIndexes": [ 2995 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2994, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12281", "outputIndexes": [ 2996 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2996 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12282", "outputIndexes": [ 2997 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2992, 2995, 2997, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12285", "outputIndexes": [ 2998 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2998 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12286", "outputIndexes": [ 2999 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2999, 2999 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12288", "outputIndexes": [ 3000 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2991, 3000, 2994 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_471_output_0", "outputIndexes": [ 3001 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3001, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_992_output_0", "outputIndexes": [ 3002 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2994 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12296", "outputIndexes": [ 3003 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2996 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12299", "outputIndexes": [ 3004 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2992, 3003, 3004, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12302", "outputIndexes": [ 3005 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3005 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12303", "outputIndexes": [ 3006 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3006 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12304", "outputIndexes": [ 3007 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3007, 3006 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12305", "outputIndexes": [ 3008 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2991, 3008, 2994 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_472_output_0", "outputIndexes": [ 3009 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3009, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_993_output_0", "outputIndexes": [ 3010 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3002, 3010, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_403_output_0", "outputIndexes": [ 3011 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2990, 3011 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_280_output_0", "outputIndexes": [ 3012 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3012 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1963342524, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_31/Mul_1_output_0", "outputIndexes": [ 3014 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3014, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_248_output_0", "outputIndexes": [ 3015 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3014 ] , "main_type": "NONE", "name": "/Shape_436_output_0", "outputIndexes": [ 3016 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3016 ] , "main_type": "NONE", "name": "Shape12424", "outputIndexes": [ 3017 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3016 ] , "main_type": "NONE", "name": "Rank12426", "outputIndexes": [ 3018 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3018, 3018 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12428", "outputIndexes": [ 3019 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3019 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12429", "outputIndexes": [ 3020 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3019, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12431", "outputIndexes": [ 3021 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3021 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12432", "outputIndexes": [ 3022 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3017, 3020, 3022, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12435", "outputIndexes": [ 3023 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3023 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12436", "outputIndexes": [ 3024 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 3024 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12437", "outputIndexes": [ 3025 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3025, 3024 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12438", "outputIndexes": [ 3026 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3016, 3026, 3019 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_473_output_0", "outputIndexes": [ 3027 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3027, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_93_output_0", "outputIndexes": [ 3028 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3028, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_999_output_0", "outputIndexes": [ 3029 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3014, 3029, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_125_output_0", "outputIndexes": [ 3030 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3030 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_62_output_0", "outputIndexes": [ 3031 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3028, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_998_output_0", "outputIndexes": [ 3032 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3014, 22, 3032, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_124_output_0", "outputIndexes": [ 3033 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3031, 3033 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_406_output_0", "outputIndexes": [ 3034 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3034, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_249_output_0", "outputIndexes": [ 3035 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3015, 3035 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_158_output_0", "outputIndexes": [ 3036 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4325 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1963343548, 1310742, 327680, 0, 0 ] } , "name": "/layers.31/self_attn/k_proj/Linear", "outputIndexes": [ 4330 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4330 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4331 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4331 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3037 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3001, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_994_output_0", "outputIndexes": [ 3038 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3009, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_995_output_0", "outputIndexes": [ 3039 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3038, 3039, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_404_output_0", "outputIndexes": [ 3040 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3037, 3040 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_281_output_0", "outputIndexes": [ 3041 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3041 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1964981970, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_31/Mul_1_output_0", "outputIndexes": [ 3043 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3043, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_250_output_0", "outputIndexes": [ 3044 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3043 ] , "main_type": "NONE", "name": "/Shape_437_output_0", "outputIndexes": [ 3045 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3045 ] , "main_type": "NONE", "name": "Shape12320", "outputIndexes": [ 3046 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3045 ] , "main_type": "NONE", "name": "Rank12322", "outputIndexes": [ 3047 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3047, 3047 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12324", "outputIndexes": [ 3048 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3048 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12325", "outputIndexes": [ 3049 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3048, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12327", "outputIndexes": [ 3050 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3050 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12328", "outputIndexes": [ 3051 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3046, 3049, 3051, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12331", "outputIndexes": [ 3052 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3052 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12332", "outputIndexes": [ 3053 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 3053 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12333", "outputIndexes": [ 3054 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3054, 3053 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12334", "outputIndexes": [ 3055 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3045, 3055, 3048 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_474_output_0", "outputIndexes": [ 3056 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3056, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_94_output_0", "outputIndexes": [ 3057 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3057, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1001_output_0", "outputIndexes": [ 3058 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3043, 3058, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_127_output_0", "outputIndexes": [ 3059 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3059 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_63_output_0", "outputIndexes": [ 3060 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3057, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1000_output_0", "outputIndexes": [ 3061 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3043, 22, 3061, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_126_output_0", "outputIndexes": [ 3062 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3060, 3062 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_407_output_0", "outputIndexes": [ 3063 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3063, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_251_output_0", "outputIndexes": [ 3064 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3044, 3064 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_159_output_0", "outputIndexes": [ 3065 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4325 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1964982994, 1310742, 327680, 0, 0 ] } , "name": "/layers.31/self_attn/v_proj/Linear", "outputIndexes": [ 4334 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4334 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4335 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4335 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3066 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3001, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_996_output_0", "outputIndexes": [ 3067 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3009, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_997_output_0", "outputIndexes": [ 3068 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3067, 3068, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_405_output_0", "outputIndexes": [ 3069 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3066, 3069 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_282_output_0", "outputIndexes": [ 3070 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3036, 3065, 3070, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_287_output_0", "outputIndexes": [ 3071 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3071 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4336 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4336 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4337 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4337 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1966621416, 5242902, 1310720, 0, 0 ] } , "name": "/layers.31/self_attn/o_proj/Linear", "outputIndexes": [ 4338 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4338 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4339 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4339 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.31/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3072 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2988, 3072 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_161_output_0", "outputIndexes": [ 3073 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3073 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1973175038, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_31/Mul_1_output_0", "outputIndexes": [ 3074 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3074 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4340 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4340 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4341 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4341 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1973195518, 12451862, 3112960, 0, 0 ] } , "name": "/layers.31/mlp/gate_proj/Linear", "outputIndexes": [ 4342 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4342 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4343 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4343 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3075 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3075 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_31/Mul_output_0", "outputIndexes": [ 3076 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4341 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1988760340, 12451862, 3112960, 0, 0 ] } , "name": "/layers.31/mlp/up_proj/Linear", "outputIndexes": [ 4346 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4346 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4347 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4347 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3077 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3076, 3077 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_31/Mul_output_0", "outputIndexes": [ 3078 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3078 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4348 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4348 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.31/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4349 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4349 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2004325162, 12451862, 3112960, 0, 0 ] } , "name": "/layers.31/mlp/down_proj/Linear", "outputIndexes": [ 4350 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4350 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4351 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4351 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.31/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3079 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3073, 3079 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_162_output_0", "outputIndexes": [ 3080 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3080, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_288_output_0", "outputIndexes": [ 3081 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3081 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2019889984, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_32/Mul_1_output_0", "outputIndexes": [ 3082 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3082 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4352 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4352 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.32/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4353 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4353 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2019910464, 5242902, 1310720, 0, 0 ] } , "name": "/layers.32/self_attn/q_proj/Linear", "outputIndexes": [ 4354 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4354 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4355 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4355 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3083 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3082 ] , "main_type": "NONE", "name": "/Shape_448_output_0", "outputIndexes": [ 3084 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3084 ] , "main_type": "NONE", "name": "Shape12663", "outputIndexes": [ 3085 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3084 ] , "main_type": "NONE", "name": "Rank12665", "outputIndexes": [ 3086 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3086, 3086 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12667", "outputIndexes": [ 3087 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3087 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12668", "outputIndexes": [ 3088 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3087, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12670", "outputIndexes": [ 3089 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3089 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12671", "outputIndexes": [ 3090 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3085, 3088, 3090, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12674", "outputIndexes": [ 3091 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3091 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12675", "outputIndexes": [ 3092 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3092, 3092 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12677", "outputIndexes": [ 3093 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3084, 3093, 3087 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_486_output_0", "outputIndexes": [ 3094 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3094, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1024_output_0", "outputIndexes": [ 3095 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3087 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12685", "outputIndexes": [ 3096 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3089 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12688", "outputIndexes": [ 3097 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3085, 3096, 3097, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12691", "outputIndexes": [ 3098 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3098 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12692", "outputIndexes": [ 3099 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3099 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12693", "outputIndexes": [ 3100 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3100, 3099 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12694", "outputIndexes": [ 3101 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3084, 3101, 3087 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_487_output_0", "outputIndexes": [ 3102 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3102, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1025_output_0", "outputIndexes": [ 3103 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3095, 3103, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_416_output_0", "outputIndexes": [ 3104 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3083, 3104 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_289_output_0", "outputIndexes": [ 3105 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3105 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2026464086, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_32/Mul_1_output_0", "outputIndexes": [ 3107 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3107, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_256_output_0", "outputIndexes": [ 3108 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3107 ] , "main_type": "NONE", "name": "/Shape_450_output_0", "outputIndexes": [ 3109 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3109 ] , "main_type": "NONE", "name": "Shape12813", "outputIndexes": [ 3110 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3109 ] , "main_type": "NONE", "name": "Rank12815", "outputIndexes": [ 3111 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3111, 3111 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12817", "outputIndexes": [ 3112 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3112 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12818", "outputIndexes": [ 3113 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3112, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12820", "outputIndexes": [ 3114 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3114 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12821", "outputIndexes": [ 3115 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3110, 3113, 3115, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12824", "outputIndexes": [ 3116 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3116 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12825", "outputIndexes": [ 3117 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 3117 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12826", "outputIndexes": [ 3118 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3118, 3117 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12827", "outputIndexes": [ 3119 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3109, 3119, 3112 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_488_output_0", "outputIndexes": [ 3120 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3120, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_96_output_0", "outputIndexes": [ 3121 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3121, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1031_output_0", "outputIndexes": [ 3122 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3107, 3122, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_129_output_0", "outputIndexes": [ 3123 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3123 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_64_output_0", "outputIndexes": [ 3124 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3121, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1030_output_0", "outputIndexes": [ 3125 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3107, 22, 3125, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_128_output_0", "outputIndexes": [ 3126 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3124, 3126 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_419_output_0", "outputIndexes": [ 3127 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3127, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_257_output_0", "outputIndexes": [ 3128 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3108, 3128 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_163_output_0", "outputIndexes": [ 3129 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4353 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2026465110, 1310742, 327680, 0, 0 ] } , "name": "/layers.32/self_attn/k_proj/Linear", "outputIndexes": [ 4358 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4358 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4359 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4359 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3130 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3094, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1026_output_0", "outputIndexes": [ 3131 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3102, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1027_output_0", "outputIndexes": [ 3132 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3131, 3132, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_417_output_0", "outputIndexes": [ 3133 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3130, 3133 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_290_output_0", "outputIndexes": [ 3134 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3134 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2028103532, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_32/Mul_1_output_0", "outputIndexes": [ 3136 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3136, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_258_output_0", "outputIndexes": [ 3137 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3136 ] , "main_type": "NONE", "name": "/Shape_451_output_0", "outputIndexes": [ 3138 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3138 ] , "main_type": "NONE", "name": "Shape12709", "outputIndexes": [ 3139 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3138 ] , "main_type": "NONE", "name": "Rank12711", "outputIndexes": [ 3140 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3140, 3140 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12713", "outputIndexes": [ 3141 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3141 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12714", "outputIndexes": [ 3142 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3141, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12716", "outputIndexes": [ 3143 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3143 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze12717", "outputIndexes": [ 3144 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3139, 3142, 3144, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice12720", "outputIndexes": [ 3145 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3145 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze12721", "outputIndexes": [ 3146 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 3146 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12722", "outputIndexes": [ 3147 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3147, 3146 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp12723", "outputIndexes": [ 3148 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3138, 3148, 3141 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_489_output_0", "outputIndexes": [ 3149 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3149, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_97_output_0", "outputIndexes": [ 3150 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3150, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1033_output_0", "outputIndexes": [ 3151 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3136, 3151, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_131_output_0", "outputIndexes": [ 3152 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3152 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_65_output_0", "outputIndexes": [ 3153 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3150, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1032_output_0", "outputIndexes": [ 3154 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3136, 22, 3154, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_130_output_0", "outputIndexes": [ 3155 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3153, 3155 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_420_output_0", "outputIndexes": [ 3156 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3156, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_259_output_0", "outputIndexes": [ 3157 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3137, 3157 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_164_output_0", "outputIndexes": [ 3158 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4353 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2028104556, 1310742, 327680, 0, 0 ] } , "name": "/layers.32/self_attn/v_proj/Linear", "outputIndexes": [ 4362 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4362 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4363 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4363 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3159 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3094, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1028_output_0", "outputIndexes": [ 3160 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3102, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1029_output_0", "outputIndexes": [ 3161 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3160, 3161, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_418_output_0", "outputIndexes": [ 3162 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3159, 3162 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_291_output_0", "outputIndexes": [ 3163 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3129, 3158, 3163, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_296_output_0", "outputIndexes": [ 3164 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3164 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4364 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4364 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.32/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4365 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4365 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2029742978, 5242902, 1310720, 0, 0 ] } , "name": "/layers.32/self_attn/o_proj/Linear", "outputIndexes": [ 4366 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4366 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4367 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4367 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.32/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3165 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3081, 3165 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_166_output_0", "outputIndexes": [ 3166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3166 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2036296600, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_32/Mul_1_output_0", "outputIndexes": [ 3167 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3167 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.32/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4368 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4368 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.32/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4369 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4369 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2036317080, 12451862, 3112960, 0, 0 ] } , "name": "/layers.32/mlp/gate_proj/Linear", "outputIndexes": [ 4370 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4370 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4371 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4371 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.32/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3168 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3168 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_32/Mul_output_0", "outputIndexes": [ 3169 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4369 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2051881902, 12451862, 3112960, 0, 0 ] } , "name": "/layers.32/mlp/up_proj/Linear", "outputIndexes": [ 4374 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4374 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4375 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4375 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.32/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3170 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3169, 3170 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_32/Mul_output_0", "outputIndexes": [ 3171 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3171 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.32/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4376 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4376 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.32/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4377 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4377 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2067446724, 12451862, 3112960, 0, 0 ] } , "name": "/layers.32/mlp/down_proj/Linear", "outputIndexes": [ 4378 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4378 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.32/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4379 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4379 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.32/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3172 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3166, 3172 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_167_output_0", "outputIndexes": [ 3173 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3173, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_297_output_0", "outputIndexes": [ 3174 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3174 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2083011546, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_33/Mul_1_output_0", "outputIndexes": [ 3175 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3175 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4380 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4380 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.33/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4381 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4381 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2083032026, 5242902, 1310720, 0, 0 ] } , "name": "/layers.33/self_attn/q_proj/Linear", "outputIndexes": [ 4382 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4382 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4383 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4383 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3176 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3175 ] , "main_type": "NONE", "name": "/Shape_462_output_0", "outputIndexes": [ 3177 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3177 ] , "main_type": "NONE", "name": "Shape13052", "outputIndexes": [ 3178 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3177 ] , "main_type": "NONE", "name": "Rank13054", "outputIndexes": [ 3179 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3179, 3179 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13056", "outputIndexes": [ 3180 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3180 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13057", "outputIndexes": [ 3181 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3180, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13059", "outputIndexes": [ 3182 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3182 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13060", "outputIndexes": [ 3183 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3178, 3181, 3183, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13063", "outputIndexes": [ 3184 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3184 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13064", "outputIndexes": [ 3185 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3185, 3185 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13066", "outputIndexes": [ 3186 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3177, 3186, 3180 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_501_output_0", "outputIndexes": [ 3187 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3187, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1056_output_0", "outputIndexes": [ 3188 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3180 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13074", "outputIndexes": [ 3189 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3182 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13077", "outputIndexes": [ 3190 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3178, 3189, 3190, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13080", "outputIndexes": [ 3191 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3191 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13081", "outputIndexes": [ 3192 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3192 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13082", "outputIndexes": [ 3193 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3193, 3192 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13083", "outputIndexes": [ 3194 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3177, 3194, 3180 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_502_output_0", "outputIndexes": [ 3195 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3195, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1057_output_0", "outputIndexes": [ 3196 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3188, 3196, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_429_output_0", "outputIndexes": [ 3197 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3176, 3197 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_298_output_0", "outputIndexes": [ 3198 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3198 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2089585648, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_33/Mul_1_output_0", "outputIndexes": [ 3200 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3200, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_264_output_0", "outputIndexes": [ 3201 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3200 ] , "main_type": "NONE", "name": "/Shape_464_output_0", "outputIndexes": [ 3202 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3202 ] , "main_type": "NONE", "name": "Shape13202", "outputIndexes": [ 3203 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3202 ] , "main_type": "NONE", "name": "Rank13204", "outputIndexes": [ 3204 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3204, 3204 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13206", "outputIndexes": [ 3205 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3205 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13207", "outputIndexes": [ 3206 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3205, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13209", "outputIndexes": [ 3207 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3207 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13210", "outputIndexes": [ 3208 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3203, 3206, 3208, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13213", "outputIndexes": [ 3209 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3209 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13214", "outputIndexes": [ 3210 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 3210 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13215", "outputIndexes": [ 3211 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3211, 3210 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13216", "outputIndexes": [ 3212 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3202, 3212, 3205 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_503_output_0", "outputIndexes": [ 3213 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3213, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_99_output_0", "outputIndexes": [ 3214 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3214, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1063_output_0", "outputIndexes": [ 3215 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3200, 3215, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_133_output_0", "outputIndexes": [ 3216 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3216 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_66_output_0", "outputIndexes": [ 3217 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3214, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1062_output_0", "outputIndexes": [ 3218 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3200, 22, 3218, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_132_output_0", "outputIndexes": [ 3219 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3217, 3219 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_432_output_0", "outputIndexes": [ 3220 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3220, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_265_output_0", "outputIndexes": [ 3221 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3201, 3221 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_168_output_0", "outputIndexes": [ 3222 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4381 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2089586672, 1310742, 327680, 0, 0 ] } , "name": "/layers.33/self_attn/k_proj/Linear", "outputIndexes": [ 4386 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4386 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4387 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4387 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3223 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3187, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1058_output_0", "outputIndexes": [ 3224 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3195, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1059_output_0", "outputIndexes": [ 3225 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3224, 3225, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_430_output_0", "outputIndexes": [ 3226 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3223, 3226 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_299_output_0", "outputIndexes": [ 3227 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3227 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2091225094, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_33/Mul_1_output_0", "outputIndexes": [ 3229 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3229, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_266_output_0", "outputIndexes": [ 3230 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3229 ] , "main_type": "NONE", "name": "/Shape_465_output_0", "outputIndexes": [ 3231 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3231 ] , "main_type": "NONE", "name": "Shape13098", "outputIndexes": [ 3232 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3231 ] , "main_type": "NONE", "name": "Rank13100", "outputIndexes": [ 3233 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3233, 3233 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13102", "outputIndexes": [ 3234 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3234 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13103", "outputIndexes": [ 3235 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3234, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13105", "outputIndexes": [ 3236 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3236 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13106", "outputIndexes": [ 3237 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3232, 3235, 3237, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13109", "outputIndexes": [ 3238 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3238 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13110", "outputIndexes": [ 3239 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 3239 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13111", "outputIndexes": [ 3240 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3240, 3239 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13112", "outputIndexes": [ 3241 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3231, 3241, 3234 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_504_output_0", "outputIndexes": [ 3242 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3242, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_100_output_0", "outputIndexes": [ 3243 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3243, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1065_output_0", "outputIndexes": [ 3244 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3229, 3244, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_135_output_0", "outputIndexes": [ 3245 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3245 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_67_output_0", "outputIndexes": [ 3246 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3243, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1064_output_0", "outputIndexes": [ 3247 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3229, 22, 3247, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_134_output_0", "outputIndexes": [ 3248 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3246, 3248 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_433_output_0", "outputIndexes": [ 3249 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3249, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_267_output_0", "outputIndexes": [ 3250 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3230, 3250 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_169_output_0", "outputIndexes": [ 3251 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4381 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2091226118, 1310742, 327680, 0, 0 ] } , "name": "/layers.33/self_attn/v_proj/Linear", "outputIndexes": [ 4390 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4390 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4391 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4391 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3252 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3187, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1060_output_0", "outputIndexes": [ 3253 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3195, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1061_output_0", "outputIndexes": [ 3254 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3253, 3254, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_431_output_0", "outputIndexes": [ 3255 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3252, 3255 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_300_output_0", "outputIndexes": [ 3256 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3222, 3251, 3256, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_305_output_0", "outputIndexes": [ 3257 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3257 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4392 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4392 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.33/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4393 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4393 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2092864540, 5242902, 1310720, 0, 0 ] } , "name": "/layers.33/self_attn/o_proj/Linear", "outputIndexes": [ 4394 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4394 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4395 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4395 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.33/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3258 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3174, 3258 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_171_output_0", "outputIndexes": [ 3259 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3259 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2099418162, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_33/Mul_1_output_0", "outputIndexes": [ 3260 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3260 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.33/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4396 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4396 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.33/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4397 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4397 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2099438642, 12451862, 3112960, 0, 0 ] } , "name": "/layers.33/mlp/gate_proj/Linear", "outputIndexes": [ 4398 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4398 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4399 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4399 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.33/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3261 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3261 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_33/Mul_output_0", "outputIndexes": [ 3262 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4397 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2115003464, 12451862, 3112960, 0, 0 ] } , "name": "/layers.33/mlp/up_proj/Linear", "outputIndexes": [ 4402 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4402 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4403 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4403 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.33/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3263 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3262, 3263 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_33/Mul_output_0", "outputIndexes": [ 3264 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3264 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.33/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4404 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4404 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.33/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4405 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4405 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2130568286, 12451862, 3112960, 0, 0 ] } , "name": "/layers.33/mlp/down_proj/Linear", "outputIndexes": [ 4406 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4406 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.33/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4407 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4407 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.33/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3265 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3259, 3265 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_172_output_0", "outputIndexes": [ 3266 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3266, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_306_output_0", "outputIndexes": [ 3267 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3267 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2146133108, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_34/Mul_1_output_0", "outputIndexes": [ 3268 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3268 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4408 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4408 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.34/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4409 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4409 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2146153588, 5242902, 1310720, 0, 0 ] } , "name": "/layers.34/self_attn/q_proj/Linear", "outputIndexes": [ 4410 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4410 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4411 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4411 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3269 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3268 ] , "main_type": "NONE", "name": "/Shape_476_output_0", "outputIndexes": [ 3270 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3270 ] , "main_type": "NONE", "name": "Shape13441", "outputIndexes": [ 3271 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3270 ] , "main_type": "NONE", "name": "Rank13443", "outputIndexes": [ 3272 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3272, 3272 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13445", "outputIndexes": [ 3273 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3273 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13446", "outputIndexes": [ 3274 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3273, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13448", "outputIndexes": [ 3275 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3275 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13449", "outputIndexes": [ 3276 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3271, 3274, 3276, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13452", "outputIndexes": [ 3277 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3277 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13453", "outputIndexes": [ 3278 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3278, 3278 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13455", "outputIndexes": [ 3279 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3270, 3279, 3273 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_516_output_0", "outputIndexes": [ 3280 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3280, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1088_output_0", "outputIndexes": [ 3281 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3273 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13463", "outputIndexes": [ 3282 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3275 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13466", "outputIndexes": [ 3283 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3271, 3282, 3283, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13469", "outputIndexes": [ 3284 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3284 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13470", "outputIndexes": [ 3285 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3285 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13471", "outputIndexes": [ 3286 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3286, 3285 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13472", "outputIndexes": [ 3287 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3270, 3287, 3273 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_517_output_0", "outputIndexes": [ 3288 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3288, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1089_output_0", "outputIndexes": [ 3289 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3281, 3289, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_442_output_0", "outputIndexes": [ 3290 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3269, 3290 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_307_output_0", "outputIndexes": [ 3291 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3291 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2152707210, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_34/Mul_1_output_0", "outputIndexes": [ 3293 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3293, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_272_output_0", "outputIndexes": [ 3294 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3293 ] , "main_type": "NONE", "name": "/Shape_478_output_0", "outputIndexes": [ 3295 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3295 ] , "main_type": "NONE", "name": "Shape13591", "outputIndexes": [ 3296 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3295 ] , "main_type": "NONE", "name": "Rank13593", "outputIndexes": [ 3297 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3297, 3297 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13595", "outputIndexes": [ 3298 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3298 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13596", "outputIndexes": [ 3299 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3298, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13598", "outputIndexes": [ 3300 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3300 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13599", "outputIndexes": [ 3301 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3296, 3299, 3301, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13602", "outputIndexes": [ 3302 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3302 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13603", "outputIndexes": [ 3303 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 3303 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13604", "outputIndexes": [ 3304 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3304, 3303 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13605", "outputIndexes": [ 3305 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3295, 3305, 3298 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_518_output_0", "outputIndexes": [ 3306 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3306, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_102_output_0", "outputIndexes": [ 3307 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3307, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1095_output_0", "outputIndexes": [ 3308 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3293, 3308, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_137_output_0", "outputIndexes": [ 3309 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3309 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_68_output_0", "outputIndexes": [ 3310 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3307, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1094_output_0", "outputIndexes": [ 3311 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3293, 22, 3311, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_136_output_0", "outputIndexes": [ 3312 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3310, 3312 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_445_output_0", "outputIndexes": [ 3313 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3313, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_273_output_0", "outputIndexes": [ 3314 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3294, 3314 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_173_output_0", "outputIndexes": [ 3315 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4409 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2152708234, 1310742, 327680, 0, 0 ] } , "name": "/layers.34/self_attn/k_proj/Linear", "outputIndexes": [ 4414 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4414 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4415 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4415 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3316 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3280, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1090_output_0", "outputIndexes": [ 3317 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3288, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1091_output_0", "outputIndexes": [ 3318 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3317, 3318, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_443_output_0", "outputIndexes": [ 3319 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3316, 3319 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_308_output_0", "outputIndexes": [ 3320 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3320 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2154346656, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_34/Mul_1_output_0", "outputIndexes": [ 3322 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3322, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_274_output_0", "outputIndexes": [ 3323 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3322 ] , "main_type": "NONE", "name": "/Shape_479_output_0", "outputIndexes": [ 3324 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3324 ] , "main_type": "NONE", "name": "Shape13487", "outputIndexes": [ 3325 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3324 ] , "main_type": "NONE", "name": "Rank13489", "outputIndexes": [ 3326 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3326, 3326 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13491", "outputIndexes": [ 3327 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3327 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13492", "outputIndexes": [ 3328 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3327, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13494", "outputIndexes": [ 3329 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3329 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13495", "outputIndexes": [ 3330 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3325, 3328, 3330, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13498", "outputIndexes": [ 3331 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3331 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13499", "outputIndexes": [ 3332 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 3332 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13500", "outputIndexes": [ 3333 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3333, 3332 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13501", "outputIndexes": [ 3334 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3324, 3334, 3327 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_519_output_0", "outputIndexes": [ 3335 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3335, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_103_output_0", "outputIndexes": [ 3336 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3336, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1097_output_0", "outputIndexes": [ 3337 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3322, 3337, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_139_output_0", "outputIndexes": [ 3338 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3338 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_69_output_0", "outputIndexes": [ 3339 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3336, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1096_output_0", "outputIndexes": [ 3340 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3322, 22, 3340, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_138_output_0", "outputIndexes": [ 3341 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3339, 3341 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_446_output_0", "outputIndexes": [ 3342 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3342, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_275_output_0", "outputIndexes": [ 3343 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3323, 3343 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_174_output_0", "outputIndexes": [ 3344 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4409 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2154347680, 1310742, 327680, 0, 0 ] } , "name": "/layers.34/self_attn/v_proj/Linear", "outputIndexes": [ 4418 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4418 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4419 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4419 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3345 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3280, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1092_output_0", "outputIndexes": [ 3346 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3288, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1093_output_0", "outputIndexes": [ 3347 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3346, 3347, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_444_output_0", "outputIndexes": [ 3348 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3345, 3348 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_309_output_0", "outputIndexes": [ 3349 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3315, 3344, 3349, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_314_output_0", "outputIndexes": [ 3350 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3350 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4420 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4420 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.34/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4421 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4421 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2155986102, 5242902, 1310720, 0, 0 ] } , "name": "/layers.34/self_attn/o_proj/Linear", "outputIndexes": [ 4422 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4422 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4423 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4423 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.34/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3351 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3267, 3351 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_176_output_0", "outputIndexes": [ 3352 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3352 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2162539724, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_34/Mul_1_output_0", "outputIndexes": [ 3353 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3353 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.34/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4424 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4424 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.34/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4425 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4425 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2162560204, 12451862, 3112960, 0, 0 ] } , "name": "/layers.34/mlp/gate_proj/Linear", "outputIndexes": [ 4426 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4426 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4427 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4427 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.34/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3354 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3354 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_34/Mul_output_0", "outputIndexes": [ 3355 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4425 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2178125026, 12451862, 3112960, 0, 0 ] } , "name": "/layers.34/mlp/up_proj/Linear", "outputIndexes": [ 4430 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4430 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4431 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4431 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.34/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3356 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3355, 3356 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_34/Mul_output_0", "outputIndexes": [ 3357 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3357 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.34/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4432 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4432 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.34/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4433 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4433 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2193689848, 12451862, 3112960, 0, 0 ] } , "name": "/layers.34/mlp/down_proj/Linear", "outputIndexes": [ 4434 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4434 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.34/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4435 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4435 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.34/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3358 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3352, 3358 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_177_output_0", "outputIndexes": [ 3359 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3359, 5 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_315_output_0", "outputIndexes": [ 3360 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3360 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2209254670, 10240, 10240 ] , "useRMSNorm": true } , "name": "/input_layernorm_35/Mul_1_output_0", "outputIndexes": [ 3361 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3361 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 4436 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4436 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.35/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 4437 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4437 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4096, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2209275150, 5242902, 1310720, 0, 0 ] } , "name": "/layers.35/self_attn/q_proj/Linear", "outputIndexes": [ 4438 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4438 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 4439 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4439 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4096 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 3362 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3361 ] , "main_type": "NONE", "name": "/Shape_490_output_0", "outputIndexes": [ 3363 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3363 ] , "main_type": "NONE", "name": "Shape13830", "outputIndexes": [ 3364 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3363 ] , "main_type": "NONE", "name": "Rank13832", "outputIndexes": [ 3365 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3365, 3365 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13834", "outputIndexes": [ 3366 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3366 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13835", "outputIndexes": [ 3367 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3366, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13837", "outputIndexes": [ 3368 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3368 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13838", "outputIndexes": [ 3369 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3364, 3367, 3369, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13841", "outputIndexes": [ 3370 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3370 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13842", "outputIndexes": [ 3371 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3371, 3371 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13844", "outputIndexes": [ 3372 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3363, 3372, 3366 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_531_output_0", "outputIndexes": [ 3373 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3373, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1120_output_0", "outputIndexes": [ 3374 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3366 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13852", "outputIndexes": [ 3375 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3368 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13855", "outputIndexes": [ 3376 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3364, 3375, 3376, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13858", "outputIndexes": [ 3377 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3377 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13859", "outputIndexes": [ 3378 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 14, 3378 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13860", "outputIndexes": [ 3379 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3379, 3378 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13861", "outputIndexes": [ 3380 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3363, 3380, 3366 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_532_output_0", "outputIndexes": [ 3381 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3381, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1121_output_0", "outputIndexes": [ 3382 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3374, 3382, 32, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_455_output_0", "outputIndexes": [ 3383 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3362, 3383 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_316_output_0", "outputIndexes": [ 3384 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3384 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2215828772, 512, 512 ] , "useRMSNorm": true } , "name": "/q_norm_35/Mul_1_output_0", "outputIndexes": [ 3386 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3386, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_280_output_0", "outputIndexes": [ 3387 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3386 ] , "main_type": "NONE", "name": "/Shape_492_output_0", "outputIndexes": [ 3388 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3388 ] , "main_type": "NONE", "name": "Shape13948", "outputIndexes": [ 3389 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3388 ] , "main_type": "NONE", "name": "Rank13950", "outputIndexes": [ 3390 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3390, 3390 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13952", "outputIndexes": [ 3391 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3391 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13953", "outputIndexes": [ 3392 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3391, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13955", "outputIndexes": [ 3393 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3393 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13956", "outputIndexes": [ 3394 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3389, 3392, 3394, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13959", "outputIndexes": [ 3395 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3395 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13960", "outputIndexes": [ 3396 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 3396 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13961", "outputIndexes": [ 3397 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3397, 3396 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13962", "outputIndexes": [ 3398 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3388, 3398, 3391 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_533_output_0", "outputIndexes": [ 3399 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3399, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_105_output_0", "outputIndexes": [ 3400 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3400, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1127_output_0", "outputIndexes": [ 3401 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3386, 3401, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_141_output_0", "outputIndexes": [ 3402 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3402 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_70_output_0", "outputIndexes": [ 3403 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3400, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1126_output_0", "outputIndexes": [ 3404 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3386, 22, 3404, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_140_output_0", "outputIndexes": [ 3405 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3403, 3405 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_458_output_0", "outputIndexes": [ 3406 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3406, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_281_output_0", "outputIndexes": [ 3407 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3387, 3407 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_178_output_0", "outputIndexes": [ 3408 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4437 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2215829796, 1310742, 327680, 0, 0 ] } , "name": "/layers.35/self_attn/k_proj/Linear", "outputIndexes": [ 4442 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4442 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 4443 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4443 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 3409 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3373, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1122_output_0", "outputIndexes": [ 3410 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3381, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1123_output_0", "outputIndexes": [ 3411 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3410, 3411, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_456_output_0", "outputIndexes": [ 3412 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3409, 3412 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_317_output_0", "outputIndexes": [ 3413 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3413 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2217468218, 512, 512 ] , "useRMSNorm": true } , "name": "/k_norm_35/Mul_1_output_0", "outputIndexes": [ 3415 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3415, 91 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_282_output_0", "outputIndexes": [ 3416 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3415 ] , "main_type": "NONE", "name": "/Shape_493_output_0", "outputIndexes": [ 3417 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3417 ] , "main_type": "NONE", "name": "Shape13876", "outputIndexes": [ 3418 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 3417 ] , "main_type": "NONE", "name": "Rank13878", "outputIndexes": [ 3419 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3419, 3419 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13880", "outputIndexes": [ 3420 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3420 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13881", "outputIndexes": [ 3421 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3420, 14 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13883", "outputIndexes": [ 3422 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3422 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze13884", "outputIndexes": [ 3423 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3418, 3421, 3423, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice13887", "outputIndexes": [ 3424 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3424 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze13888", "outputIndexes": [ 3425 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 94, 3425 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13889", "outputIndexes": [ 3426 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3426, 3425 ] , "main_type": "BinaryOp", "main": { "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp13890", "outputIndexes": [ 3427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3417, 3427, 3420 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_534_output_0", "outputIndexes": [ 3428 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3428, 62 ] , "main_type": "BinaryOp", "main": { "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_106_output_0", "outputIndexes": [ 3429 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3429, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1129_output_0", "outputIndexes": [ 3430 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3415, 3430, 108, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_143_output_0", "outputIndexes": [ 3431 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3431 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_71_output_0", "outputIndexes": [ 3432 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3429, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1128_output_0", "outputIndexes": [ 3433 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3415, 22, 3433, 109, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_142_output_0", "outputIndexes": [ 3434 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3432, 3434 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_459_output_0", "outputIndexes": [ 3435 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3435, 121 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_283_output_0", "outputIndexes": [ 3436 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3416, 3436 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_179_output_0", "outputIndexes": [ 3437 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4437 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 40960, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2217469242, 1310742, 327680, 0, 0 ] } , "name": "/layers.35/self_attn/v_proj/Linear", "outputIndexes": [ 4446 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4446 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 4447 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4447 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1024 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 3438 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3373, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1124_output_0", "outputIndexes": [ 3439 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3381, 22 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1125_output_0", "outputIndexes": [ 3440 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3439, 3440, 127, 33 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_457_output_0", "outputIndexes": [ 3441 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3438, 3441 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_318_output_0", "outputIndexes": [ 3442 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3408, 3437, 3442, 159 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_323_output_0", "outputIndexes": [ 3443 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3443 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4096, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 4448 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4448 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.35/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 4449 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4449 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 4096, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 163840, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2219107664, 5242902, 1310720, 0, 0 ] } , "name": "/layers.35/self_attn/o_proj/Linear", "outputIndexes": [ 4450 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4450 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 4451 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4451 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.35/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 3444 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3360, 3444 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_181_output_0", "outputIndexes": [ 3445 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3445 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2225661286, 10240, 10240 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_35/Mul_1_output_0", "outputIndexes": [ 3446 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3446 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.35/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 4452 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4452 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.35/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 4453 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4453 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2225681766, 12451862, 3112960, 0, 0 ] } , "name": "/layers.35/mlp/gate_proj/Linear", "outputIndexes": [ 4454 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4454 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 4455 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4455 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.35/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 3447 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3447 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_35/Mul_output_0", "outputIndexes": [ 3448 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4453 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 9728, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2241246588, 12451862, 3112960, 0, 0 ] } , "name": "/layers.35/mlp/up_proj/Linear", "outputIndexes": [ 4458 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4458 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 4459 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4459 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 9728 ] , "dimType": "NCHW" } , "name": "/layers.35/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 3449 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3448, 3449 ] , "main_type": "BinaryOp", "main": { "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_35/Mul_output_0", "outputIndexes": [ 3450 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3450 ] , "main_type": "Reshape", "main": { "dims": [ -1, 9728, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.35/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 4460 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4460 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.35/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 4461 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4461 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 2560, "inputCount": 9728, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 389120, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2256811410, 12451862, 3112960, 0, 0 ] } , "name": "/layers.35/mlp/down_proj/Linear", "outputIndexes": [ 4462 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4462 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.35/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 4463 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4463 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 2560 ] , "dimType": "NCHW" } , "name": "/layers.35/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 3451 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3445, 3451 ] , "main_type": "BinaryOp", "main": { "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_182_output_0", "outputIndexes": [ 3452 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3452, 3, 108, 17, 17 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_144_output_0", "outputIndexes": [ 3453 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3453 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 2272376232, 10240, 10240 ] , "useRMSNorm": true } , "name": "hidden_states", "outputIndexes": [ 3454 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 3454 ] , "main_type": "Reshape", "main": { "dims": [ -1, 2560, 1, 1 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/pre_reshape", "outputIndexes": [ 4464 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4464 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/lm/lm_head/Linear/pre_convert", "outputIndexes": [ 4465 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4465 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 151936, "inputCount": 2560, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6077440, "has_scaleInt": false, "shapeInt32": true, "weightSize": 0 } , "external": [ 2272396712, 388956426, 48619520, 0, 0 ] } , "name": "/lm/lm_head/Linear", "outputIndexes": [ 4466 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4466 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/lm/lm_head/Linear/post_convert", "outputIndexes": [ 4467 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4467 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 151936 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/post_reshape", "outputIndexes": [ 3455 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } ] , "outputName": [ "logits", "hidden_states", "presents" ] , "preferForwardType": "CPU", "sourceType": "ONNX", "tensorName": [ "past_key_values", "presents", "position_ids", "logits_index", "input_ids", "/Constant_output_0", "/Reshape_output_0", "/input_layernorm/Mul_1_output_0", "/FakeLinear_output_0", "/Shape_output_0", "Shape52", "Rank54", "BinaryOp56", "Unsqueeze57", "Const9", "BinaryOp59", "Unsqueeze60", "Unsqueeze62", "StridedSlice63", "Squeeze64", "BinaryOp66", "/Gather_1_output_0", "/rotary/Constant_8_output_0", "/Unsqueeze_output_0", "Unsqueeze76", "Unsqueeze79", "StridedSlice82", "Squeeze83", "BinaryOp84", "BinaryOp85", "/Gather_2_output_0", "/Unsqueeze_1_output_0", "/Constant_4_output_0", "/Constant_5_output_0", "/Concat_output_0", "/Reshape_1_output_0", "/q_norm/Cast_output_0", "/q_norm/Mul_1_output_0", "/rotary/Cast_output_0", "/rotary/Constant_1_output_0", "/rotary/Unsqueeze_output_0", "Shape104", "Rank106", "BinaryOp108", "Unsqueeze109", "BinaryOp111", "Unsqueeze112", "StridedSlice115", "Squeeze116", "BinaryOp118", "/rotary/Gather_output_0", "/rotary/Constant_3_output_0", "/rotary/Mul_output_0", "Unsqueeze127", "Unsqueeze130", "StridedSlice133", "Squeeze134", "BinaryOp135", "BinaryOp136", "/rotary/Gather_1_output_0", "/rotary/Constant_5_output_0", "/rotary/Mul_1_output_0", "/rotary/Constant_6_output_0", "Unsqueeze146", "Unsqueeze149", "StridedSlice152", "Squeeze153", "BinaryOp154", "BinaryOp155", "/rotary/Gather_2_output_0", "/rotary/Constant_7_output_0", "/rotary/Mul_2_output_0", "/rotary/Concat_output_0", "/rotary/Cos_output_0", "/rotary/Unsqueeze_1_output_0", "/rotary/Sin_output_0", "/rotary/Unsqueeze_2_output_0", "/rotary/Concat_1_output_0", "/rotary/Concat_2_output_0", "/rotary/Constant_10_output_0", "/rotary/Unsqueeze_3_output_0", "/rotary/Unsqueeze_4_output_0", "Shape170", "Rank172", "BinaryOp174", "Unsqueeze175", "BinaryOp177", "Unsqueeze178", "StridedSlice181", "Squeeze182", "BinaryOp184", "/Gather_3_output_0", "/Mul_output_0", "/Shape_2_output_0", "/Constant_11_output_0", "Shape311", "Rank313", "BinaryOp315", "Unsqueeze316", "BinaryOp318", "Unsqueeze319", "StridedSlice322", "Squeeze323", "BinaryOp324", "BinaryOp325", "/Gather_5_output_0", "/Div_output_0", "/Unsqueeze_7_output_0", "/Constant_20_output_0", "/Constant_14_output_0", "/Slice_1_output_0", "/Neg_output_0", "/Unsqueeze_6_output_0", "/Slice_output_0", "/Concat_3_output_0", "Unsqueeze220", "Unsqueeze223", "StridedSlice226", "Squeeze227", "BinaryOp228", "BinaryOp229", "/Gather_4_output_0", "/Mul_1_output_0", "/Add_output_0", "/FakeLinear_1_output_0", "/Unsqueeze_2_output_0", "/Unsqueeze_3_output_0", "/Constant_7_output_0", "/Concat_1_output_0", "/Reshape_2_output_0", "/k_norm/Cast_output_0", "/k_norm/Mul_1_output_0", "/Mul_2_output_0", "/Shape_3_output_0", "Shape189", "Rank191", "BinaryOp193", "Unsqueeze194", "BinaryOp196", "Unsqueeze197", "StridedSlice200", "Squeeze201", "BinaryOp202", "BinaryOp203", "/Gather_6_output_0", "/Div_1_output_0", "/Unsqueeze_9_output_0", "/Slice_3_output_0", "/Neg_1_output_0", "/Unsqueeze_8_output_0", "/Slice_2_output_0", "/Concat_4_output_0", "/Mul_3_output_0", "/Add_1_output_0", "/FakeLinear_2_output_0", "/Unsqueeze_4_output_0", "/Unsqueeze_5_output_0", "/Concat_2_output_0", "/Reshape_3_output_0", "attention_mask", "/Reshape_8_output_0", "/FakeLinear_3_output_0", "/Add_3_output_0", "/post_attention_layernorm/Mul_1_output_0", "/mlp/gate_proj/FakeLinear_output_0", "/mlp/act_fn/Mul_output_0", "/mlp/up_proj/FakeLinear_output_0", "/mlp/Mul_output_0", "/mlp/down_proj/FakeLinear_output_0", "/Add_4_output_0", "deepstack_embeds", "Shape546", "Rank548", "BinaryOp550", "Unsqueeze551", "BinaryOp553", "Unsqueeze554", "StridedSlice557", "Squeeze558", "BinaryOp560", "/Gather_17_output_0", "/Add_5_output_0", "/Reshape_9_output_0", "/input_layernorm_1/Mul_1_output_0", "/FakeLinear_4_output_0", "/Shape_14_output_0", "Shape573", "Rank575", "BinaryOp577", "Unsqueeze578", "BinaryOp580", "Unsqueeze581", "StridedSlice584", "Squeeze585", "BinaryOp587", "/Gather_19_output_0", "/Unsqueeze_32_output_0", "Unsqueeze595", "Unsqueeze598", "StridedSlice601", "Squeeze602", "BinaryOp603", "BinaryOp604", "/Gather_20_output_0", "/Unsqueeze_33_output_0", "/Concat_13_output_0", "/Reshape_10_output_0", "/q_norm_1/Cast_output_0", "/q_norm_1/Mul_1_output_0", "/Mul_8_output_0", "/Shape_16_output_0", "Shape722", "Rank724", "BinaryOp726", "Unsqueeze727", "BinaryOp729", "Unsqueeze730", "StridedSlice733", "Squeeze734", "BinaryOp735", "BinaryOp736", "/Gather_21_output_0", "/Div_3_output_0", "/Unsqueeze_39_output_0", "/Slice_5_output_0", "/Neg_2_output_0", "/Unsqueeze_38_output_0", "/Slice_4_output_0", "/Concat_16_output_0", "/Mul_9_output_0", "/Add_6_output_0", "/FakeLinear_5_output_0", "/Unsqueeze_34_output_0", "/Unsqueeze_35_output_0", "/Concat_14_output_0", "/Reshape_11_output_0", "/k_norm_1/Cast_output_0", "/k_norm_1/Mul_1_output_0", "/Mul_10_output_0", "/Shape_17_output_0", "Shape619", "Rank621", "BinaryOp623", "Unsqueeze624", "BinaryOp626", "Unsqueeze627", "StridedSlice630", "Squeeze631", "BinaryOp632", "BinaryOp633", "/Gather_22_output_0", "/Div_4_output_0", "/Unsqueeze_41_output_0", "/Slice_7_output_0", "/Neg_3_output_0", "/Unsqueeze_40_output_0", "/Slice_6_output_0", "/Concat_17_output_0", "/Mul_11_output_0", "/Add_7_output_0", "/FakeLinear_6_output_0", "/Unsqueeze_36_output_0", "/Unsqueeze_37_output_0", "/Concat_15_output_0", "/Reshape_12_output_0", "/Reshape_17_output_0", "/FakeLinear_7_output_0", "/Add_9_output_0", "/post_attention_layernorm_1/Mul_1_output_0", "/mlp/gate_proj_1/FakeLinear_output_0", "/mlp/act_fn_1/Mul_output_0", "/mlp/up_proj_1/FakeLinear_output_0", "/mlp_1/Mul_output_0", "/mlp/down_proj_1/FakeLinear_output_0", "/Add_10_output_0", "Unsqueeze956", "Unsqueeze959", "StridedSlice962", "Squeeze963", "BinaryOp964", "BinaryOp965", "/Gather_33_output_0", "/Add_11_output_0", "/Reshape_18_output_0", "/input_layernorm_2/Mul_1_output_0", "/FakeLinear_8_output_0", "/Shape_28_output_0", "Shape978", "Rank980", "BinaryOp982", "Unsqueeze983", "BinaryOp985", "Unsqueeze986", "StridedSlice989", "Squeeze990", "BinaryOp992", "/Gather_35_output_0", "/Unsqueeze_64_output_0", "Unsqueeze1000", "Unsqueeze1003", "StridedSlice1006", "Squeeze1007", "BinaryOp1008", "BinaryOp1009", "/Gather_36_output_0", "/Unsqueeze_65_output_0", "/Concat_26_output_0", "/Reshape_19_output_0", "/q_norm_2/Cast_output_0", "/q_norm_2/Mul_1_output_0", "/Mul_16_output_0", "/Shape_30_output_0", "Shape1127", "Rank1129", "BinaryOp1131", "Unsqueeze1132", "BinaryOp1134", "Unsqueeze1135", "StridedSlice1138", "Squeeze1139", "BinaryOp1140", "BinaryOp1141", "/Gather_37_output_0", "/Div_6_output_0", "/Unsqueeze_71_output_0", "/Slice_9_output_0", "/Neg_4_output_0", "/Unsqueeze_70_output_0", "/Slice_8_output_0", "/Concat_29_output_0", "/Mul_17_output_0", "/Add_12_output_0", "/FakeLinear_9_output_0", "/Unsqueeze_66_output_0", "/Unsqueeze_67_output_0", "/Concat_27_output_0", "/Reshape_20_output_0", "/k_norm_2/Cast_output_0", "/k_norm_2/Mul_1_output_0", "/Mul_18_output_0", "/Shape_31_output_0", "Shape1024", "Rank1026", "BinaryOp1028", "Unsqueeze1029", "BinaryOp1031", "Unsqueeze1032", "StridedSlice1035", "Squeeze1036", "BinaryOp1037", "BinaryOp1038", "/Gather_38_output_0", "/Div_7_output_0", "/Unsqueeze_73_output_0", "/Slice_11_output_0", "/Neg_5_output_0", "/Unsqueeze_72_output_0", "/Slice_10_output_0", "/Concat_30_output_0", "/Mul_19_output_0", "/Add_13_output_0", "/FakeLinear_10_output_0", "/Unsqueeze_68_output_0", "/Unsqueeze_69_output_0", "/Concat_28_output_0", "/Reshape_21_output_0", "/Reshape_26_output_0", "/FakeLinear_11_output_0", "/Add_15_output_0", "/post_attention_layernorm_2/Mul_1_output_0", "/mlp/gate_proj_2/FakeLinear_output_0", "/mlp/act_fn_2/Mul_output_0", "/mlp/up_proj_2/FakeLinear_output_0", "/mlp_2/Mul_output_0", "/mlp/down_proj_2/FakeLinear_output_0", "/Add_16_output_0", "Unsqueeze1361", "Unsqueeze1364", "StridedSlice1367", "Squeeze1368", "BinaryOp1369", "BinaryOp1370", "/Gather_49_output_0", "/Add_17_output_0", "/Reshape_27_output_0", "/input_layernorm_3/Mul_1_output_0", "/FakeLinear_12_output_0", "/Shape_42_output_0", "Shape1383", "Rank1385", "BinaryOp1387", "Unsqueeze1388", "BinaryOp1390", "Unsqueeze1391", "StridedSlice1394", "Squeeze1395", "BinaryOp1397", "/Gather_51_output_0", "/Unsqueeze_96_output_0", "Unsqueeze1405", "Unsqueeze1408", "StridedSlice1411", "Squeeze1412", "BinaryOp1413", "BinaryOp1414", "/Gather_52_output_0", "/Unsqueeze_97_output_0", "/Concat_39_output_0", "/Reshape_28_output_0", "/q_norm_3/Cast_output_0", "/q_norm_3/Mul_1_output_0", "/Mul_24_output_0", "/Shape_44_output_0", "Shape1532", "Rank1534", "BinaryOp1536", "Unsqueeze1537", "BinaryOp1539", "Unsqueeze1540", "StridedSlice1543", "Squeeze1544", "BinaryOp1545", "BinaryOp1546", "/Gather_53_output_0", "/Div_9_output_0", "/Unsqueeze_103_output_0", "/Slice_13_output_0", "/Neg_6_output_0", "/Unsqueeze_102_output_0", "/Slice_12_output_0", "/Concat_42_output_0", "/Mul_25_output_0", "/Add_18_output_0", "/FakeLinear_13_output_0", "/Unsqueeze_98_output_0", "/Unsqueeze_99_output_0", "/Concat_40_output_0", "/Reshape_29_output_0", "/k_norm_3/Cast_output_0", "/k_norm_3/Mul_1_output_0", "/Mul_26_output_0", "/Shape_45_output_0", "Shape1429", "Rank1431", "BinaryOp1433", "Unsqueeze1434", "BinaryOp1436", "Unsqueeze1437", "StridedSlice1440", "Squeeze1441", "BinaryOp1442", "BinaryOp1443", "/Gather_54_output_0", "/Div_10_output_0", "/Unsqueeze_105_output_0", "/Slice_15_output_0", "/Neg_7_output_0", "/Unsqueeze_104_output_0", "/Slice_14_output_0", "/Concat_43_output_0", "/Mul_27_output_0", "/Add_19_output_0", "/FakeLinear_14_output_0", "/Unsqueeze_100_output_0", "/Unsqueeze_101_output_0", "/Concat_41_output_0", "/Reshape_30_output_0", "/Reshape_35_output_0", "/FakeLinear_15_output_0", "/Add_21_output_0", "/post_attention_layernorm_3/Mul_1_output_0", "/mlp/gate_proj_3/FakeLinear_output_0", "/mlp/act_fn_3/Mul_output_0", "/mlp/up_proj_3/FakeLinear_output_0", "/mlp_3/Mul_output_0", "/mlp/down_proj_3/FakeLinear_output_0", "/Add_22_output_0", "/Reshape_36_output_0", "/input_layernorm_4/Mul_1_output_0", "/FakeLinear_16_output_0", "/Shape_56_output_0", "Shape1771", "Rank1773", "BinaryOp1775", "Unsqueeze1776", "BinaryOp1778", "Unsqueeze1779", "StridedSlice1782", "Squeeze1783", "BinaryOp1785", "/Gather_66_output_0", "/Unsqueeze_128_output_0", "Unsqueeze1793", "Unsqueeze1796", "StridedSlice1799", "Squeeze1800", "BinaryOp1801", "BinaryOp1802", "/Gather_67_output_0", "/Unsqueeze_129_output_0", "/Concat_52_output_0", "/Reshape_37_output_0", "/q_norm_4/Cast_output_0", "/q_norm_4/Mul_1_output_0", "/Mul_32_output_0", "/Shape_58_output_0", "Shape1921", "Rank1923", "BinaryOp1925", "Unsqueeze1926", "BinaryOp1928", "Unsqueeze1929", "StridedSlice1932", "Squeeze1933", "BinaryOp1934", "BinaryOp1935", "/Gather_68_output_0", "/Div_12_output_0", "/Unsqueeze_135_output_0", "/Slice_17_output_0", "/Neg_8_output_0", "/Unsqueeze_134_output_0", "/Slice_16_output_0", "/Concat_55_output_0", "/Mul_33_output_0", "/Add_23_output_0", "/FakeLinear_17_output_0", "/Unsqueeze_130_output_0", "/Unsqueeze_131_output_0", "/Concat_53_output_0", "/Reshape_38_output_0", "/k_norm_4/Cast_output_0", "/k_norm_4/Mul_1_output_0", "/Mul_34_output_0", "/Shape_59_output_0", "Shape1817", "Rank1819", "BinaryOp1821", "Unsqueeze1822", "BinaryOp1824", "Unsqueeze1825", "StridedSlice1828", "Squeeze1829", "BinaryOp1830", "BinaryOp1831", "/Gather_69_output_0", "/Div_13_output_0", "/Unsqueeze_137_output_0", "/Slice_19_output_0", "/Neg_9_output_0", "/Unsqueeze_136_output_0", "/Slice_18_output_0", "/Concat_56_output_0", "/Mul_35_output_0", "/Add_24_output_0", "/FakeLinear_18_output_0", "/Unsqueeze_132_output_0", "/Unsqueeze_133_output_0", "/Concat_54_output_0", "/Reshape_39_output_0", "/Reshape_44_output_0", "/FakeLinear_19_output_0", "/Add_26_output_0", "/post_attention_layernorm_4/Mul_1_output_0", "/mlp/gate_proj_4/FakeLinear_output_0", "/mlp/act_fn_4/Mul_output_0", "/mlp/up_proj_4/FakeLinear_output_0", "/mlp_4/Mul_output_0", "/mlp/down_proj_4/FakeLinear_output_0", "/Add_27_output_0", "/Reshape_45_output_0", "/input_layernorm_5/Mul_1_output_0", "/FakeLinear_20_output_0", "/Shape_70_output_0", "Shape2160", "Rank2162", "BinaryOp2164", "Unsqueeze2165", "BinaryOp2167", "Unsqueeze2168", "StridedSlice2171", "Squeeze2172", "BinaryOp2174", "/Gather_81_output_0", "/Unsqueeze_160_output_0", "Unsqueeze2182", "Unsqueeze2185", "StridedSlice2188", "Squeeze2189", "BinaryOp2190", "BinaryOp2191", "/Gather_82_output_0", "/Unsqueeze_161_output_0", "/Concat_65_output_0", "/Reshape_46_output_0", "/q_norm_5/Cast_output_0", "/q_norm_5/Mul_1_output_0", "/Mul_40_output_0", "/Shape_72_output_0", "Shape2310", "Rank2312", "BinaryOp2314", "Unsqueeze2315", "BinaryOp2317", "Unsqueeze2318", "StridedSlice2321", "Squeeze2322", "BinaryOp2323", "BinaryOp2324", "/Gather_83_output_0", "/Div_15_output_0", "/Unsqueeze_167_output_0", "/Slice_21_output_0", "/Neg_10_output_0", "/Unsqueeze_166_output_0", "/Slice_20_output_0", "/Concat_68_output_0", "/Mul_41_output_0", "/Add_28_output_0", "/FakeLinear_21_output_0", "/Unsqueeze_162_output_0", "/Unsqueeze_163_output_0", "/Concat_66_output_0", "/Reshape_47_output_0", "/k_norm_5/Cast_output_0", "/k_norm_5/Mul_1_output_0", "/Mul_42_output_0", "/Shape_73_output_0", "Shape2206", "Rank2208", "BinaryOp2210", "Unsqueeze2211", "BinaryOp2213", "Unsqueeze2214", "StridedSlice2217", "Squeeze2218", "BinaryOp2219", "BinaryOp2220", "/Gather_84_output_0", "/Div_16_output_0", "/Unsqueeze_169_output_0", "/Slice_23_output_0", "/Neg_11_output_0", "/Unsqueeze_168_output_0", "/Slice_22_output_0", "/Concat_69_output_0", "/Mul_43_output_0", "/Add_29_output_0", "/FakeLinear_22_output_0", "/Unsqueeze_164_output_0", "/Unsqueeze_165_output_0", "/Concat_67_output_0", "/Reshape_48_output_0", "/Reshape_53_output_0", "/FakeLinear_23_output_0", "/Add_31_output_0", "/post_attention_layernorm_5/Mul_1_output_0", "/mlp/gate_proj_5/FakeLinear_output_0", "/mlp/act_fn_5/Mul_output_0", "/mlp/up_proj_5/FakeLinear_output_0", "/mlp_5/Mul_output_0", "/mlp/down_proj_5/FakeLinear_output_0", "/Add_32_output_0", "/Reshape_54_output_0", "/input_layernorm_6/Mul_1_output_0", "/FakeLinear_24_output_0", "/Shape_84_output_0", "Shape2549", "Rank2551", "BinaryOp2553", "Unsqueeze2554", "BinaryOp2556", "Unsqueeze2557", "StridedSlice2560", "Squeeze2561", "BinaryOp2563", "/Gather_96_output_0", "/Unsqueeze_192_output_0", "Unsqueeze2571", "Unsqueeze2574", "StridedSlice2577", "Squeeze2578", "BinaryOp2579", "BinaryOp2580", "/Gather_97_output_0", "/Unsqueeze_193_output_0", "/Concat_78_output_0", "/Reshape_55_output_0", "/q_norm_6/Cast_output_0", "/q_norm_6/Mul_1_output_0", "/Mul_48_output_0", "/Shape_86_output_0", "Shape2699", "Rank2701", "BinaryOp2703", "Unsqueeze2704", "BinaryOp2706", "Unsqueeze2707", "StridedSlice2710", "Squeeze2711", "BinaryOp2712", "BinaryOp2713", "/Gather_98_output_0", "/Div_18_output_0", "/Unsqueeze_199_output_0", "/Slice_25_output_0", "/Neg_12_output_0", "/Unsqueeze_198_output_0", "/Slice_24_output_0", "/Concat_81_output_0", "/Mul_49_output_0", "/Add_33_output_0", "/FakeLinear_25_output_0", "/Unsqueeze_194_output_0", "/Unsqueeze_195_output_0", "/Concat_79_output_0", "/Reshape_56_output_0", "/k_norm_6/Cast_output_0", "/k_norm_6/Mul_1_output_0", "/Mul_50_output_0", "/Shape_87_output_0", "Shape2595", "Rank2597", "BinaryOp2599", "Unsqueeze2600", "BinaryOp2602", "Unsqueeze2603", "StridedSlice2606", "Squeeze2607", "BinaryOp2608", "BinaryOp2609", "/Gather_99_output_0", "/Div_19_output_0", "/Unsqueeze_201_output_0", "/Slice_27_output_0", "/Neg_13_output_0", "/Unsqueeze_200_output_0", "/Slice_26_output_0", "/Concat_82_output_0", "/Mul_51_output_0", "/Add_34_output_0", "/FakeLinear_26_output_0", "/Unsqueeze_196_output_0", "/Unsqueeze_197_output_0", "/Concat_80_output_0", "/Reshape_57_output_0", "/Reshape_62_output_0", "/FakeLinear_27_output_0", "/Add_36_output_0", "/post_attention_layernorm_6/Mul_1_output_0", "/mlp/gate_proj_6/FakeLinear_output_0", "/mlp/act_fn_6/Mul_output_0", "/mlp/up_proj_6/FakeLinear_output_0", "/mlp_6/Mul_output_0", "/mlp/down_proj_6/FakeLinear_output_0", "/Add_37_output_0", "/Reshape_63_output_0", "/input_layernorm_7/Mul_1_output_0", "/FakeLinear_28_output_0", "/Shape_98_output_0", "Shape2938", "Rank2940", "BinaryOp2942", "Unsqueeze2943", "BinaryOp2945", "Unsqueeze2946", "StridedSlice2949", "Squeeze2950", "BinaryOp2952", "/Gather_111_output_0", "/Unsqueeze_224_output_0", "Unsqueeze2960", "Unsqueeze2963", "StridedSlice2966", "Squeeze2967", "BinaryOp2968", "BinaryOp2969", "/Gather_112_output_0", "/Unsqueeze_225_output_0", "/Concat_91_output_0", "/Reshape_64_output_0", "/q_norm_7/Cast_output_0", "/q_norm_7/Mul_1_output_0", "/Mul_56_output_0", "/Shape_100_output_0", "Shape3088", "Rank3090", "BinaryOp3092", "Unsqueeze3093", "BinaryOp3095", "Unsqueeze3096", "StridedSlice3099", "Squeeze3100", "BinaryOp3101", "BinaryOp3102", "/Gather_113_output_0", "/Div_21_output_0", "/Unsqueeze_231_output_0", "/Slice_29_output_0", "/Neg_14_output_0", "/Unsqueeze_230_output_0", "/Slice_28_output_0", "/Concat_94_output_0", "/Mul_57_output_0", "/Add_38_output_0", "/FakeLinear_29_output_0", "/Unsqueeze_226_output_0", "/Unsqueeze_227_output_0", "/Concat_92_output_0", "/Reshape_65_output_0", "/k_norm_7/Cast_output_0", "/k_norm_7/Mul_1_output_0", "/Mul_58_output_0", "/Shape_101_output_0", "Shape2984", "Rank2986", "BinaryOp2988", "Unsqueeze2989", "BinaryOp2991", "Unsqueeze2992", "StridedSlice2995", "Squeeze2996", "BinaryOp2997", "BinaryOp2998", "/Gather_114_output_0", "/Div_22_output_0", "/Unsqueeze_233_output_0", "/Slice_31_output_0", "/Neg_15_output_0", "/Unsqueeze_232_output_0", "/Slice_30_output_0", "/Concat_95_output_0", "/Mul_59_output_0", "/Add_39_output_0", "/FakeLinear_30_output_0", "/Unsqueeze_228_output_0", "/Unsqueeze_229_output_0", "/Concat_93_output_0", "/Reshape_66_output_0", "/Reshape_71_output_0", "/FakeLinear_31_output_0", "/Add_41_output_0", "/post_attention_layernorm_7/Mul_1_output_0", "/mlp/gate_proj_7/FakeLinear_output_0", "/mlp/act_fn_7/Mul_output_0", "/mlp/up_proj_7/FakeLinear_output_0", "/mlp_7/Mul_output_0", "/mlp/down_proj_7/FakeLinear_output_0", "/Add_42_output_0", "/Reshape_72_output_0", "/input_layernorm_8/Mul_1_output_0", "/FakeLinear_32_output_0", "/Shape_112_output_0", "Shape3327", "Rank3329", "BinaryOp3331", "Unsqueeze3332", "BinaryOp3334", "Unsqueeze3335", "StridedSlice3338", "Squeeze3339", "BinaryOp3341", "/Gather_126_output_0", "/Unsqueeze_256_output_0", "Unsqueeze3349", "Unsqueeze3352", "StridedSlice3355", "Squeeze3356", "BinaryOp3357", "BinaryOp3358", "/Gather_127_output_0", "/Unsqueeze_257_output_0", "/Concat_104_output_0", "/Reshape_73_output_0", "/q_norm_8/Cast_output_0", "/q_norm_8/Mul_1_output_0", "/Mul_64_output_0", "/Shape_114_output_0", "Shape3477", "Rank3479", "BinaryOp3481", "Unsqueeze3482", "BinaryOp3484", "Unsqueeze3485", "StridedSlice3488", "Squeeze3489", "BinaryOp3490", "BinaryOp3491", "/Gather_128_output_0", "/Div_24_output_0", "/Unsqueeze_263_output_0", "/Slice_33_output_0", "/Neg_16_output_0", "/Unsqueeze_262_output_0", "/Slice_32_output_0", "/Concat_107_output_0", "/Mul_65_output_0", "/Add_43_output_0", "/FakeLinear_33_output_0", "/Unsqueeze_258_output_0", "/Unsqueeze_259_output_0", "/Concat_105_output_0", "/Reshape_74_output_0", "/k_norm_8/Cast_output_0", "/k_norm_8/Mul_1_output_0", "/Mul_66_output_0", "/Shape_115_output_0", "Shape3373", "Rank3375", "BinaryOp3377", "Unsqueeze3378", "BinaryOp3380", "Unsqueeze3381", "StridedSlice3384", "Squeeze3385", "BinaryOp3386", "BinaryOp3387", "/Gather_129_output_0", "/Div_25_output_0", "/Unsqueeze_265_output_0", "/Slice_35_output_0", "/Neg_17_output_0", "/Unsqueeze_264_output_0", "/Slice_34_output_0", "/Concat_108_output_0", "/Mul_67_output_0", "/Add_44_output_0", "/FakeLinear_34_output_0", "/Unsqueeze_260_output_0", "/Unsqueeze_261_output_0", "/Concat_106_output_0", "/Reshape_75_output_0", "/Reshape_80_output_0", "/FakeLinear_35_output_0", "/Add_46_output_0", "/post_attention_layernorm_8/Mul_1_output_0", "/mlp/gate_proj_8/FakeLinear_output_0", "/mlp/act_fn_8/Mul_output_0", "/mlp/up_proj_8/FakeLinear_output_0", "/mlp_8/Mul_output_0", "/mlp/down_proj_8/FakeLinear_output_0", "/Add_47_output_0", "/Reshape_81_output_0", "/input_layernorm_9/Mul_1_output_0", "/FakeLinear_36_output_0", "/Shape_126_output_0", "Shape3716", "Rank3718", "BinaryOp3720", "Unsqueeze3721", "BinaryOp3723", "Unsqueeze3724", "StridedSlice3727", "Squeeze3728", "BinaryOp3730", "/Gather_141_output_0", "/Unsqueeze_288_output_0", "Unsqueeze3738", "Unsqueeze3741", "StridedSlice3744", "Squeeze3745", "BinaryOp3746", "BinaryOp3747", "/Gather_142_output_0", "/Unsqueeze_289_output_0", "/Concat_117_output_0", "/Reshape_82_output_0", "/q_norm_9/Cast_output_0", "/q_norm_9/Mul_1_output_0", "/Mul_72_output_0", "/Shape_128_output_0", "Shape3866", "Rank3868", "BinaryOp3870", "Unsqueeze3871", "BinaryOp3873", "Unsqueeze3874", "StridedSlice3877", "Squeeze3878", "BinaryOp3879", "BinaryOp3880", "/Gather_143_output_0", "/Div_27_output_0", "/Unsqueeze_295_output_0", "/Slice_37_output_0", "/Neg_18_output_0", "/Unsqueeze_294_output_0", "/Slice_36_output_0", "/Concat_120_output_0", "/Mul_73_output_0", "/Add_48_output_0", "/FakeLinear_37_output_0", "/Unsqueeze_290_output_0", "/Unsqueeze_291_output_0", "/Concat_118_output_0", "/Reshape_83_output_0", "/k_norm_9/Cast_output_0", "/k_norm_9/Mul_1_output_0", "/Mul_74_output_0", "/Shape_129_output_0", "Shape3762", "Rank3764", "BinaryOp3766", "Unsqueeze3767", "BinaryOp3769", "Unsqueeze3770", "StridedSlice3773", "Squeeze3774", "BinaryOp3775", "BinaryOp3776", "/Gather_144_output_0", "/Div_28_output_0", "/Unsqueeze_297_output_0", "/Slice_39_output_0", "/Neg_19_output_0", "/Unsqueeze_296_output_0", "/Slice_38_output_0", "/Concat_121_output_0", "/Mul_75_output_0", "/Add_49_output_0", "/FakeLinear_38_output_0", "/Unsqueeze_292_output_0", "/Unsqueeze_293_output_0", "/Concat_119_output_0", "/Reshape_84_output_0", "/Reshape_89_output_0", "/FakeLinear_39_output_0", "/Add_51_output_0", "/post_attention_layernorm_9/Mul_1_output_0", "/mlp/gate_proj_9/FakeLinear_output_0", "/mlp/act_fn_9/Mul_output_0", "/mlp/up_proj_9/FakeLinear_output_0", "/mlp_9/Mul_output_0", "/mlp/down_proj_9/FakeLinear_output_0", "/Add_52_output_0", "/Reshape_90_output_0", "/input_layernorm_10/Mul_1_output_0", "/FakeLinear_40_output_0", "/Shape_140_output_0", "Shape4105", "Rank4107", "BinaryOp4109", "Unsqueeze4110", "BinaryOp4112", "Unsqueeze4113", "StridedSlice4116", "Squeeze4117", "BinaryOp4119", "/Gather_156_output_0", "/Unsqueeze_320_output_0", "Unsqueeze4127", "Unsqueeze4130", "StridedSlice4133", "Squeeze4134", "BinaryOp4135", "BinaryOp4136", "/Gather_157_output_0", "/Unsqueeze_321_output_0", "/Concat_130_output_0", "/Reshape_91_output_0", "/q_norm_10/Cast_output_0", "/q_norm_10/Mul_1_output_0", "/Mul_80_output_0", "/Shape_142_output_0", "Shape4255", "Rank4257", "BinaryOp4259", "Unsqueeze4260", "BinaryOp4262", "Unsqueeze4263", "StridedSlice4266", "Squeeze4267", "BinaryOp4268", "BinaryOp4269", "/Gather_158_output_0", "/Div_30_output_0", "/Unsqueeze_327_output_0", "/Slice_41_output_0", "/Neg_20_output_0", "/Unsqueeze_326_output_0", "/Slice_40_output_0", "/Concat_133_output_0", "/Mul_81_output_0", "/Add_53_output_0", "/FakeLinear_41_output_0", "/Unsqueeze_322_output_0", "/Unsqueeze_323_output_0", "/Concat_131_output_0", "/Reshape_92_output_0", "/k_norm_10/Cast_output_0", "/k_norm_10/Mul_1_output_0", "/Mul_82_output_0", "/Shape_143_output_0", "Shape4151", "Rank4153", "BinaryOp4155", "Unsqueeze4156", "BinaryOp4158", "Unsqueeze4159", "StridedSlice4162", "Squeeze4163", "BinaryOp4164", "BinaryOp4165", "/Gather_159_output_0", "/Div_31_output_0", "/Unsqueeze_329_output_0", "/Slice_43_output_0", "/Neg_21_output_0", "/Unsqueeze_328_output_0", "/Slice_42_output_0", "/Concat_134_output_0", "/Mul_83_output_0", "/Add_54_output_0", "/FakeLinear_42_output_0", "/Unsqueeze_324_output_0", "/Unsqueeze_325_output_0", "/Concat_132_output_0", "/Reshape_93_output_0", "/Reshape_98_output_0", "/FakeLinear_43_output_0", "/Add_56_output_0", "/post_attention_layernorm_10/Mul_1_output_0", "/mlp/gate_proj_10/FakeLinear_output_0", "/mlp/act_fn_10/Mul_output_0", "/mlp/up_proj_10/FakeLinear_output_0", "/mlp_10/Mul_output_0", "/mlp/down_proj_10/FakeLinear_output_0", "/Add_57_output_0", "/Reshape_99_output_0", "/input_layernorm_11/Mul_1_output_0", "/FakeLinear_44_output_0", "/Shape_154_output_0", "Shape4494", "Rank4496", "BinaryOp4498", "Unsqueeze4499", "BinaryOp4501", "Unsqueeze4502", "StridedSlice4505", "Squeeze4506", "BinaryOp4508", "/Gather_171_output_0", "/Unsqueeze_352_output_0", "Unsqueeze4516", "Unsqueeze4519", "StridedSlice4522", "Squeeze4523", "BinaryOp4524", "BinaryOp4525", "/Gather_172_output_0", "/Unsqueeze_353_output_0", "/Concat_143_output_0", "/Reshape_100_output_0", "/q_norm_11/Cast_output_0", "/q_norm_11/Mul_1_output_0", "/Mul_88_output_0", "/Shape_156_output_0", "Shape4644", "Rank4646", "BinaryOp4648", "Unsqueeze4649", "BinaryOp4651", "Unsqueeze4652", "StridedSlice4655", "Squeeze4656", "BinaryOp4657", "BinaryOp4658", "/Gather_173_output_0", "/Div_33_output_0", "/Unsqueeze_359_output_0", "/Slice_45_output_0", "/Neg_22_output_0", "/Unsqueeze_358_output_0", "/Slice_44_output_0", "/Concat_146_output_0", "/Mul_89_output_0", "/Add_58_output_0", "/FakeLinear_45_output_0", "/Unsqueeze_354_output_0", "/Unsqueeze_355_output_0", "/Concat_144_output_0", "/Reshape_101_output_0", "/k_norm_11/Cast_output_0", "/k_norm_11/Mul_1_output_0", "/Mul_90_output_0", "/Shape_157_output_0", "Shape4540", "Rank4542", "BinaryOp4544", "Unsqueeze4545", "BinaryOp4547", "Unsqueeze4548", "StridedSlice4551", "Squeeze4552", "BinaryOp4553", "BinaryOp4554", "/Gather_174_output_0", "/Div_34_output_0", "/Unsqueeze_361_output_0", "/Slice_47_output_0", "/Neg_23_output_0", "/Unsqueeze_360_output_0", "/Slice_46_output_0", "/Concat_147_output_0", "/Mul_91_output_0", "/Add_59_output_0", "/FakeLinear_46_output_0", "/Unsqueeze_356_output_0", "/Unsqueeze_357_output_0", "/Concat_145_output_0", "/Reshape_102_output_0", "/Reshape_107_output_0", "/FakeLinear_47_output_0", "/Add_61_output_0", "/post_attention_layernorm_11/Mul_1_output_0", "/mlp/gate_proj_11/FakeLinear_output_0", "/mlp/act_fn_11/Mul_output_0", "/mlp/up_proj_11/FakeLinear_output_0", "/mlp_11/Mul_output_0", "/mlp/down_proj_11/FakeLinear_output_0", "/Add_62_output_0", "/Reshape_108_output_0", "/input_layernorm_12/Mul_1_output_0", "/FakeLinear_48_output_0", "/Shape_168_output_0", "Shape4883", "Rank4885", "BinaryOp4887", "Unsqueeze4888", "BinaryOp4890", "Unsqueeze4891", "StridedSlice4894", "Squeeze4895", "BinaryOp4897", "/Gather_186_output_0", "/Unsqueeze_384_output_0", "Unsqueeze4905", "Unsqueeze4908", "StridedSlice4911", "Squeeze4912", "BinaryOp4913", "BinaryOp4914", "/Gather_187_output_0", "/Unsqueeze_385_output_0", "/Concat_156_output_0", "/Reshape_109_output_0", "/q_norm_12/Cast_output_0", "/q_norm_12/Mul_1_output_0", "/Mul_96_output_0", "/Shape_170_output_0", "Shape5033", "Rank5035", "BinaryOp5037", "Unsqueeze5038", "BinaryOp5040", "Unsqueeze5041", "StridedSlice5044", "Squeeze5045", "BinaryOp5046", "BinaryOp5047", "/Gather_188_output_0", "/Div_36_output_0", "/Unsqueeze_391_output_0", "/Slice_49_output_0", "/Neg_24_output_0", "/Unsqueeze_390_output_0", "/Slice_48_output_0", "/Concat_159_output_0", "/Mul_97_output_0", "/Add_63_output_0", "/FakeLinear_49_output_0", "/Unsqueeze_386_output_0", "/Unsqueeze_387_output_0", "/Concat_157_output_0", "/Reshape_110_output_0", "/k_norm_12/Cast_output_0", "/k_norm_12/Mul_1_output_0", "/Mul_98_output_0", "/Shape_171_output_0", "Shape4929", "Rank4931", "BinaryOp4933", "Unsqueeze4934", "BinaryOp4936", "Unsqueeze4937", "StridedSlice4940", "Squeeze4941", "BinaryOp4942", "BinaryOp4943", "/Gather_189_output_0", "/Div_37_output_0", "/Unsqueeze_393_output_0", "/Slice_51_output_0", "/Neg_25_output_0", "/Unsqueeze_392_output_0", "/Slice_50_output_0", "/Concat_160_output_0", "/Mul_99_output_0", "/Add_64_output_0", "/FakeLinear_50_output_0", "/Unsqueeze_388_output_0", "/Unsqueeze_389_output_0", "/Concat_158_output_0", "/Reshape_111_output_0", "/Reshape_116_output_0", "/FakeLinear_51_output_0", "/Add_66_output_0", "/post_attention_layernorm_12/Mul_1_output_0", "/mlp/gate_proj_12/FakeLinear_output_0", "/mlp/act_fn_12/Mul_output_0", "/mlp/up_proj_12/FakeLinear_output_0", "/mlp_12/Mul_output_0", "/mlp/down_proj_12/FakeLinear_output_0", "/Add_67_output_0", "/Reshape_117_output_0", "/input_layernorm_13/Mul_1_output_0", "/FakeLinear_52_output_0", "/Shape_182_output_0", "Shape5272", "Rank5274", "BinaryOp5276", "Unsqueeze5277", "BinaryOp5279", "Unsqueeze5280", "StridedSlice5283", "Squeeze5284", "BinaryOp5286", "/Gather_201_output_0", "/Unsqueeze_416_output_0", "Unsqueeze5294", "Unsqueeze5297", "StridedSlice5300", "Squeeze5301", "BinaryOp5302", "BinaryOp5303", "/Gather_202_output_0", "/Unsqueeze_417_output_0", "/Concat_169_output_0", "/Reshape_118_output_0", "/q_norm_13/Cast_output_0", "/q_norm_13/Mul_1_output_0", "/Mul_104_output_0", "/Shape_184_output_0", "Shape5422", "Rank5424", "BinaryOp5426", "Unsqueeze5427", "BinaryOp5429", "Unsqueeze5430", "StridedSlice5433", "Squeeze5434", "BinaryOp5435", "BinaryOp5436", "/Gather_203_output_0", "/Div_39_output_0", "/Unsqueeze_423_output_0", "/Slice_53_output_0", "/Neg_26_output_0", "/Unsqueeze_422_output_0", "/Slice_52_output_0", "/Concat_172_output_0", "/Mul_105_output_0", "/Add_68_output_0", "/FakeLinear_53_output_0", "/Unsqueeze_418_output_0", "/Unsqueeze_419_output_0", "/Concat_170_output_0", "/Reshape_119_output_0", "/k_norm_13/Cast_output_0", "/k_norm_13/Mul_1_output_0", "/Mul_106_output_0", "/Shape_185_output_0", "Shape5318", "Rank5320", "BinaryOp5322", "Unsqueeze5323", "BinaryOp5325", "Unsqueeze5326", "StridedSlice5329", "Squeeze5330", "BinaryOp5331", "BinaryOp5332", "/Gather_204_output_0", "/Div_40_output_0", "/Unsqueeze_425_output_0", "/Slice_55_output_0", "/Neg_27_output_0", "/Unsqueeze_424_output_0", "/Slice_54_output_0", "/Concat_173_output_0", "/Mul_107_output_0", "/Add_69_output_0", "/FakeLinear_54_output_0", "/Unsqueeze_420_output_0", "/Unsqueeze_421_output_0", "/Concat_171_output_0", "/Reshape_120_output_0", "/Reshape_125_output_0", "/FakeLinear_55_output_0", "/Add_71_output_0", "/post_attention_layernorm_13/Mul_1_output_0", "/mlp/gate_proj_13/FakeLinear_output_0", "/mlp/act_fn_13/Mul_output_0", "/mlp/up_proj_13/FakeLinear_output_0", "/mlp_13/Mul_output_0", "/mlp/down_proj_13/FakeLinear_output_0", "/Add_72_output_0", "/Reshape_126_output_0", "/input_layernorm_14/Mul_1_output_0", "/FakeLinear_56_output_0", "/Shape_196_output_0", "Shape5661", "Rank5663", "BinaryOp5665", "Unsqueeze5666", "BinaryOp5668", "Unsqueeze5669", "StridedSlice5672", "Squeeze5673", "BinaryOp5675", "/Gather_216_output_0", "/Unsqueeze_448_output_0", "Unsqueeze5683", "Unsqueeze5686", "StridedSlice5689", "Squeeze5690", "BinaryOp5691", "BinaryOp5692", "/Gather_217_output_0", "/Unsqueeze_449_output_0", "/Concat_182_output_0", "/Reshape_127_output_0", "/q_norm_14/Cast_output_0", "/q_norm_14/Mul_1_output_0", "/Mul_112_output_0", "/Shape_198_output_0", "Shape5811", "Rank5813", "BinaryOp5815", "Unsqueeze5816", "BinaryOp5818", "Unsqueeze5819", "StridedSlice5822", "Squeeze5823", "BinaryOp5824", "BinaryOp5825", "/Gather_218_output_0", "/Div_42_output_0", "/Unsqueeze_455_output_0", "/Slice_57_output_0", "/Neg_28_output_0", "/Unsqueeze_454_output_0", "/Slice_56_output_0", "/Concat_185_output_0", "/Mul_113_output_0", "/Add_73_output_0", "/FakeLinear_57_output_0", "/Unsqueeze_450_output_0", "/Unsqueeze_451_output_0", "/Concat_183_output_0", "/Reshape_128_output_0", "/k_norm_14/Cast_output_0", "/k_norm_14/Mul_1_output_0", "/Mul_114_output_0", "/Shape_199_output_0", "Shape5707", "Rank5709", "BinaryOp5711", "Unsqueeze5712", "BinaryOp5714", "Unsqueeze5715", "StridedSlice5718", "Squeeze5719", "BinaryOp5720", "BinaryOp5721", "/Gather_219_output_0", "/Div_43_output_0", "/Unsqueeze_457_output_0", "/Slice_59_output_0", "/Neg_29_output_0", "/Unsqueeze_456_output_0", "/Slice_58_output_0", "/Concat_186_output_0", "/Mul_115_output_0", "/Add_74_output_0", "/FakeLinear_58_output_0", "/Unsqueeze_452_output_0", "/Unsqueeze_453_output_0", "/Concat_184_output_0", "/Reshape_129_output_0", "/Reshape_134_output_0", "/FakeLinear_59_output_0", "/Add_76_output_0", "/post_attention_layernorm_14/Mul_1_output_0", "/mlp/gate_proj_14/FakeLinear_output_0", "/mlp/act_fn_14/Mul_output_0", "/mlp/up_proj_14/FakeLinear_output_0", "/mlp_14/Mul_output_0", "/mlp/down_proj_14/FakeLinear_output_0", "/Add_77_output_0", "/Reshape_135_output_0", "/input_layernorm_15/Mul_1_output_0", "/FakeLinear_60_output_0", "/Shape_210_output_0", "Shape6050", "Rank6052", "BinaryOp6054", "Unsqueeze6055", "BinaryOp6057", "Unsqueeze6058", "StridedSlice6061", "Squeeze6062", "BinaryOp6064", "/Gather_231_output_0", "/Unsqueeze_480_output_0", "Unsqueeze6072", "Unsqueeze6075", "StridedSlice6078", "Squeeze6079", "BinaryOp6080", "BinaryOp6081", "/Gather_232_output_0", "/Unsqueeze_481_output_0", "/Concat_195_output_0", "/Reshape_136_output_0", "/q_norm_15/Cast_output_0", "/q_norm_15/Mul_1_output_0", "/Mul_120_output_0", "/Shape_212_output_0", "Shape6200", "Rank6202", "BinaryOp6204", "Unsqueeze6205", "BinaryOp6207", "Unsqueeze6208", "StridedSlice6211", "Squeeze6212", "BinaryOp6213", "BinaryOp6214", "/Gather_233_output_0", "/Div_45_output_0", "/Unsqueeze_487_output_0", "/Slice_61_output_0", "/Neg_30_output_0", "/Unsqueeze_486_output_0", "/Slice_60_output_0", "/Concat_198_output_0", "/Mul_121_output_0", "/Add_78_output_0", "/FakeLinear_61_output_0", "/Unsqueeze_482_output_0", "/Unsqueeze_483_output_0", "/Concat_196_output_0", "/Reshape_137_output_0", "/k_norm_15/Cast_output_0", "/k_norm_15/Mul_1_output_0", "/Mul_122_output_0", "/Shape_213_output_0", "Shape6096", "Rank6098", "BinaryOp6100", "Unsqueeze6101", "BinaryOp6103", "Unsqueeze6104", "StridedSlice6107", "Squeeze6108", "BinaryOp6109", "BinaryOp6110", "/Gather_234_output_0", "/Div_46_output_0", "/Unsqueeze_489_output_0", "/Slice_63_output_0", "/Neg_31_output_0", "/Unsqueeze_488_output_0", "/Slice_62_output_0", "/Concat_199_output_0", "/Mul_123_output_0", "/Add_79_output_0", "/FakeLinear_62_output_0", "/Unsqueeze_484_output_0", "/Unsqueeze_485_output_0", "/Concat_197_output_0", "/Reshape_138_output_0", "/Reshape_143_output_0", "/FakeLinear_63_output_0", "/Add_81_output_0", "/post_attention_layernorm_15/Mul_1_output_0", "/mlp/gate_proj_15/FakeLinear_output_0", "/mlp/act_fn_15/Mul_output_0", "/mlp/up_proj_15/FakeLinear_output_0", "/mlp_15/Mul_output_0", "/mlp/down_proj_15/FakeLinear_output_0", "/Add_82_output_0", "/Reshape_144_output_0", "/input_layernorm_16/Mul_1_output_0", "/FakeLinear_64_output_0", "/Shape_224_output_0", "Shape6439", "Rank6441", "BinaryOp6443", "Unsqueeze6444", "BinaryOp6446", "Unsqueeze6447", "StridedSlice6450", "Squeeze6451", "BinaryOp6453", "/Gather_246_output_0", "/Unsqueeze_512_output_0", "Unsqueeze6461", "Unsqueeze6464", "StridedSlice6467", "Squeeze6468", "BinaryOp6469", "BinaryOp6470", "/Gather_247_output_0", "/Unsqueeze_513_output_0", "/Concat_208_output_0", "/Reshape_145_output_0", "/q_norm_16/Cast_output_0", "/q_norm_16/Mul_1_output_0", "/Mul_128_output_0", "/Shape_226_output_0", "Shape6589", "Rank6591", "BinaryOp6593", "Unsqueeze6594", "BinaryOp6596", "Unsqueeze6597", "StridedSlice6600", "Squeeze6601", "BinaryOp6602", "BinaryOp6603", "/Gather_248_output_0", "/Div_48_output_0", "/Unsqueeze_519_output_0", "/Slice_65_output_0", "/Neg_32_output_0", "/Unsqueeze_518_output_0", "/Slice_64_output_0", "/Concat_211_output_0", "/Mul_129_output_0", "/Add_83_output_0", "/FakeLinear_65_output_0", "/Unsqueeze_514_output_0", "/Unsqueeze_515_output_0", "/Concat_209_output_0", "/Reshape_146_output_0", "/k_norm_16/Cast_output_0", "/k_norm_16/Mul_1_output_0", "/Mul_130_output_0", "/Shape_227_output_0", "Shape6485", "Rank6487", "BinaryOp6489", "Unsqueeze6490", "BinaryOp6492", "Unsqueeze6493", "StridedSlice6496", "Squeeze6497", "BinaryOp6498", "BinaryOp6499", "/Gather_249_output_0", "/Div_49_output_0", "/Unsqueeze_521_output_0", "/Slice_67_output_0", "/Neg_33_output_0", "/Unsqueeze_520_output_0", "/Slice_66_output_0", "/Concat_212_output_0", "/Mul_131_output_0", "/Add_84_output_0", "/FakeLinear_66_output_0", "/Unsqueeze_516_output_0", "/Unsqueeze_517_output_0", "/Concat_210_output_0", "/Reshape_147_output_0", "/Reshape_152_output_0", "/FakeLinear_67_output_0", "/Add_86_output_0", "/post_attention_layernorm_16/Mul_1_output_0", "/mlp/gate_proj_16/FakeLinear_output_0", "/mlp/act_fn_16/Mul_output_0", "/mlp/up_proj_16/FakeLinear_output_0", "/mlp_16/Mul_output_0", "/mlp/down_proj_16/FakeLinear_output_0", "/Add_87_output_0", "/Reshape_153_output_0", "/input_layernorm_17/Mul_1_output_0", "/FakeLinear_68_output_0", "/Shape_238_output_0", "Shape6828", "Rank6830", "BinaryOp6832", "Unsqueeze6833", "BinaryOp6835", "Unsqueeze6836", "StridedSlice6839", "Squeeze6840", "BinaryOp6842", "/Gather_261_output_0", "/Unsqueeze_544_output_0", "Unsqueeze6850", "Unsqueeze6853", "StridedSlice6856", "Squeeze6857", "BinaryOp6858", "BinaryOp6859", "/Gather_262_output_0", "/Unsqueeze_545_output_0", "/Concat_221_output_0", "/Reshape_154_output_0", "/q_norm_17/Cast_output_0", "/q_norm_17/Mul_1_output_0", "/Mul_136_output_0", "/Shape_240_output_0", "Shape6978", "Rank6980", "BinaryOp6982", "Unsqueeze6983", "BinaryOp6985", "Unsqueeze6986", "StridedSlice6989", "Squeeze6990", "BinaryOp6991", "BinaryOp6992", "/Gather_263_output_0", "/Div_51_output_0", "/Unsqueeze_551_output_0", "/Slice_69_output_0", "/Neg_34_output_0", "/Unsqueeze_550_output_0", "/Slice_68_output_0", "/Concat_224_output_0", "/Mul_137_output_0", "/Add_88_output_0", "/FakeLinear_69_output_0", "/Unsqueeze_546_output_0", "/Unsqueeze_547_output_0", "/Concat_222_output_0", "/Reshape_155_output_0", "/k_norm_17/Cast_output_0", "/k_norm_17/Mul_1_output_0", "/Mul_138_output_0", "/Shape_241_output_0", "Shape6874", "Rank6876", "BinaryOp6878", "Unsqueeze6879", "BinaryOp6881", "Unsqueeze6882", "StridedSlice6885", "Squeeze6886", "BinaryOp6887", "BinaryOp6888", "/Gather_264_output_0", "/Div_52_output_0", "/Unsqueeze_553_output_0", "/Slice_71_output_0", "/Neg_35_output_0", "/Unsqueeze_552_output_0", "/Slice_70_output_0", "/Concat_225_output_0", "/Mul_139_output_0", "/Add_89_output_0", "/FakeLinear_70_output_0", "/Unsqueeze_548_output_0", "/Unsqueeze_549_output_0", "/Concat_223_output_0", "/Reshape_156_output_0", "/Reshape_161_output_0", "/FakeLinear_71_output_0", "/Add_91_output_0", "/post_attention_layernorm_17/Mul_1_output_0", "/mlp/gate_proj_17/FakeLinear_output_0", "/mlp/act_fn_17/Mul_output_0", "/mlp/up_proj_17/FakeLinear_output_0", "/mlp_17/Mul_output_0", "/mlp/down_proj_17/FakeLinear_output_0", "/Add_92_output_0", "/Reshape_162_output_0", "/input_layernorm_18/Mul_1_output_0", "/FakeLinear_72_output_0", "/Shape_252_output_0", "Shape7217", "Rank7219", "BinaryOp7221", "Unsqueeze7222", "BinaryOp7224", "Unsqueeze7225", "StridedSlice7228", "Squeeze7229", "BinaryOp7231", "/Gather_276_output_0", "/Unsqueeze_576_output_0", "Unsqueeze7239", "Unsqueeze7242", "StridedSlice7245", "Squeeze7246", "BinaryOp7247", "BinaryOp7248", "/Gather_277_output_0", "/Unsqueeze_577_output_0", "/Concat_234_output_0", "/Reshape_163_output_0", "/q_norm_18/Cast_output_0", "/q_norm_18/Mul_1_output_0", "/Mul_144_output_0", "/Shape_254_output_0", "Shape7367", "Rank7369", "BinaryOp7371", "Unsqueeze7372", "BinaryOp7374", "Unsqueeze7375", "StridedSlice7378", "Squeeze7379", "BinaryOp7380", "BinaryOp7381", "/Gather_278_output_0", "/Div_54_output_0", "/Unsqueeze_583_output_0", "/Slice_73_output_0", "/Neg_36_output_0", "/Unsqueeze_582_output_0", "/Slice_72_output_0", "/Concat_237_output_0", "/Mul_145_output_0", "/Add_93_output_0", "/FakeLinear_73_output_0", "/Unsqueeze_578_output_0", "/Unsqueeze_579_output_0", "/Concat_235_output_0", "/Reshape_164_output_0", "/k_norm_18/Cast_output_0", "/k_norm_18/Mul_1_output_0", "/Mul_146_output_0", "/Shape_255_output_0", "Shape7263", "Rank7265", "BinaryOp7267", "Unsqueeze7268", "BinaryOp7270", "Unsqueeze7271", "StridedSlice7274", "Squeeze7275", "BinaryOp7276", "BinaryOp7277", "/Gather_279_output_0", "/Div_55_output_0", "/Unsqueeze_585_output_0", "/Slice_75_output_0", "/Neg_37_output_0", "/Unsqueeze_584_output_0", "/Slice_74_output_0", "/Concat_238_output_0", "/Mul_147_output_0", "/Add_94_output_0", "/FakeLinear_74_output_0", "/Unsqueeze_580_output_0", "/Unsqueeze_581_output_0", "/Concat_236_output_0", "/Reshape_165_output_0", "/Reshape_170_output_0", "/FakeLinear_75_output_0", "/Add_96_output_0", "/post_attention_layernorm_18/Mul_1_output_0", "/mlp/gate_proj_18/FakeLinear_output_0", "/mlp/act_fn_18/Mul_output_0", "/mlp/up_proj_18/FakeLinear_output_0", "/mlp_18/Mul_output_0", "/mlp/down_proj_18/FakeLinear_output_0", "/Add_97_output_0", "/Reshape_171_output_0", "/input_layernorm_19/Mul_1_output_0", "/FakeLinear_76_output_0", "/Shape_266_output_0", "Shape7606", "Rank7608", "BinaryOp7610", "Unsqueeze7611", "BinaryOp7613", "Unsqueeze7614", "StridedSlice7617", "Squeeze7618", "BinaryOp7620", "/Gather_291_output_0", "/Unsqueeze_608_output_0", "Unsqueeze7628", "Unsqueeze7631", "StridedSlice7634", "Squeeze7635", "BinaryOp7636", "BinaryOp7637", "/Gather_292_output_0", "/Unsqueeze_609_output_0", "/Concat_247_output_0", "/Reshape_172_output_0", "/q_norm_19/Cast_output_0", "/q_norm_19/Mul_1_output_0", "/Mul_152_output_0", "/Shape_268_output_0", "Shape7756", "Rank7758", "BinaryOp7760", "Unsqueeze7761", "BinaryOp7763", "Unsqueeze7764", "StridedSlice7767", "Squeeze7768", "BinaryOp7769", "BinaryOp7770", "/Gather_293_output_0", "/Div_57_output_0", "/Unsqueeze_615_output_0", "/Slice_77_output_0", "/Neg_38_output_0", "/Unsqueeze_614_output_0", "/Slice_76_output_0", "/Concat_250_output_0", "/Mul_153_output_0", "/Add_98_output_0", "/FakeLinear_77_output_0", "/Unsqueeze_610_output_0", "/Unsqueeze_611_output_0", "/Concat_248_output_0", "/Reshape_173_output_0", "/k_norm_19/Cast_output_0", "/k_norm_19/Mul_1_output_0", "/Mul_154_output_0", "/Shape_269_output_0", "Shape7652", "Rank7654", "BinaryOp7656", "Unsqueeze7657", "BinaryOp7659", "Unsqueeze7660", "StridedSlice7663", "Squeeze7664", "BinaryOp7665", "BinaryOp7666", "/Gather_294_output_0", "/Div_58_output_0", "/Unsqueeze_617_output_0", "/Slice_79_output_0", "/Neg_39_output_0", "/Unsqueeze_616_output_0", "/Slice_78_output_0", "/Concat_251_output_0", "/Mul_155_output_0", "/Add_99_output_0", "/FakeLinear_78_output_0", "/Unsqueeze_612_output_0", "/Unsqueeze_613_output_0", "/Concat_249_output_0", "/Reshape_174_output_0", "/Reshape_179_output_0", "/FakeLinear_79_output_0", "/Add_101_output_0", "/post_attention_layernorm_19/Mul_1_output_0", "/mlp/gate_proj_19/FakeLinear_output_0", "/mlp/act_fn_19/Mul_output_0", "/mlp/up_proj_19/FakeLinear_output_0", "/mlp_19/Mul_output_0", "/mlp/down_proj_19/FakeLinear_output_0", "/Add_102_output_0", "/Reshape_180_output_0", "/input_layernorm_20/Mul_1_output_0", "/FakeLinear_80_output_0", "/Shape_280_output_0", "Shape7995", "Rank7997", "BinaryOp7999", "Unsqueeze8000", "BinaryOp8002", "Unsqueeze8003", "StridedSlice8006", "Squeeze8007", "BinaryOp8009", "/Gather_306_output_0", "/Unsqueeze_640_output_0", "Unsqueeze8017", "Unsqueeze8020", "StridedSlice8023", "Squeeze8024", "BinaryOp8025", "BinaryOp8026", "/Gather_307_output_0", "/Unsqueeze_641_output_0", "/Concat_260_output_0", "/Reshape_181_output_0", "/q_norm_20/Cast_output_0", "/q_norm_20/Mul_1_output_0", "/Mul_160_output_0", "/Shape_282_output_0", "Shape8145", "Rank8147", "BinaryOp8149", "Unsqueeze8150", "BinaryOp8152", "Unsqueeze8153", "StridedSlice8156", "Squeeze8157", "BinaryOp8158", "BinaryOp8159", "/Gather_308_output_0", "/Div_60_output_0", "/Unsqueeze_647_output_0", "/Slice_81_output_0", "/Neg_40_output_0", "/Unsqueeze_646_output_0", "/Slice_80_output_0", "/Concat_263_output_0", "/Mul_161_output_0", "/Add_103_output_0", "/FakeLinear_81_output_0", "/Unsqueeze_642_output_0", "/Unsqueeze_643_output_0", "/Concat_261_output_0", "/Reshape_182_output_0", "/k_norm_20/Cast_output_0", "/k_norm_20/Mul_1_output_0", "/Mul_162_output_0", "/Shape_283_output_0", "Shape8041", "Rank8043", "BinaryOp8045", "Unsqueeze8046", "BinaryOp8048", "Unsqueeze8049", "StridedSlice8052", "Squeeze8053", "BinaryOp8054", "BinaryOp8055", "/Gather_309_output_0", "/Div_61_output_0", "/Unsqueeze_649_output_0", "/Slice_83_output_0", "/Neg_41_output_0", "/Unsqueeze_648_output_0", "/Slice_82_output_0", "/Concat_264_output_0", "/Mul_163_output_0", "/Add_104_output_0", "/FakeLinear_82_output_0", "/Unsqueeze_644_output_0", "/Unsqueeze_645_output_0", "/Concat_262_output_0", "/Reshape_183_output_0", "/Reshape_188_output_0", "/FakeLinear_83_output_0", "/Add_106_output_0", "/post_attention_layernorm_20/Mul_1_output_0", "/mlp/gate_proj_20/FakeLinear_output_0", "/mlp/act_fn_20/Mul_output_0", "/mlp/up_proj_20/FakeLinear_output_0", "/mlp_20/Mul_output_0", "/mlp/down_proj_20/FakeLinear_output_0", "/Add_107_output_0", "/Reshape_189_output_0", "/input_layernorm_21/Mul_1_output_0", "/FakeLinear_84_output_0", "/Shape_294_output_0", "Shape8384", "Rank8386", "BinaryOp8388", "Unsqueeze8389", "BinaryOp8391", "Unsqueeze8392", "StridedSlice8395", "Squeeze8396", "BinaryOp8398", "/Gather_321_output_0", "/Unsqueeze_672_output_0", "Unsqueeze8406", "Unsqueeze8409", "StridedSlice8412", "Squeeze8413", "BinaryOp8414", "BinaryOp8415", "/Gather_322_output_0", "/Unsqueeze_673_output_0", "/Concat_273_output_0", "/Reshape_190_output_0", "/q_norm_21/Cast_output_0", "/q_norm_21/Mul_1_output_0", "/Mul_168_output_0", "/Shape_296_output_0", "Shape8534", "Rank8536", "BinaryOp8538", "Unsqueeze8539", "BinaryOp8541", "Unsqueeze8542", "StridedSlice8545", "Squeeze8546", "BinaryOp8547", "BinaryOp8548", "/Gather_323_output_0", "/Div_63_output_0", "/Unsqueeze_679_output_0", "/Slice_85_output_0", "/Neg_42_output_0", "/Unsqueeze_678_output_0", "/Slice_84_output_0", "/Concat_276_output_0", "/Mul_169_output_0", "/Add_108_output_0", "/FakeLinear_85_output_0", "/Unsqueeze_674_output_0", "/Unsqueeze_675_output_0", "/Concat_274_output_0", "/Reshape_191_output_0", "/k_norm_21/Cast_output_0", "/k_norm_21/Mul_1_output_0", "/Mul_170_output_0", "/Shape_297_output_0", "Shape8430", "Rank8432", "BinaryOp8434", "Unsqueeze8435", "BinaryOp8437", "Unsqueeze8438", "StridedSlice8441", "Squeeze8442", "BinaryOp8443", "BinaryOp8444", "/Gather_324_output_0", "/Div_64_output_0", "/Unsqueeze_681_output_0", "/Slice_87_output_0", "/Neg_43_output_0", "/Unsqueeze_680_output_0", "/Slice_86_output_0", "/Concat_277_output_0", "/Mul_171_output_0", "/Add_109_output_0", "/FakeLinear_86_output_0", "/Unsqueeze_676_output_0", "/Unsqueeze_677_output_0", "/Concat_275_output_0", "/Reshape_192_output_0", "/Reshape_197_output_0", "/FakeLinear_87_output_0", "/Add_111_output_0", "/post_attention_layernorm_21/Mul_1_output_0", "/mlp/gate_proj_21/FakeLinear_output_0", "/mlp/act_fn_21/Mul_output_0", "/mlp/up_proj_21/FakeLinear_output_0", "/mlp_21/Mul_output_0", "/mlp/down_proj_21/FakeLinear_output_0", "/Add_112_output_0", "/Reshape_198_output_0", "/input_layernorm_22/Mul_1_output_0", "/FakeLinear_88_output_0", "/Shape_308_output_0", "Shape8773", "Rank8775", "BinaryOp8777", "Unsqueeze8778", "BinaryOp8780", "Unsqueeze8781", "StridedSlice8784", "Squeeze8785", "BinaryOp8787", "/Gather_336_output_0", "/Unsqueeze_704_output_0", "Unsqueeze8795", "Unsqueeze8798", "StridedSlice8801", "Squeeze8802", "BinaryOp8803", "BinaryOp8804", "/Gather_337_output_0", "/Unsqueeze_705_output_0", "/Concat_286_output_0", "/Reshape_199_output_0", "/q_norm_22/Cast_output_0", "/q_norm_22/Mul_1_output_0", "/Mul_176_output_0", "/Shape_310_output_0", "Shape8923", "Rank8925", "BinaryOp8927", "Unsqueeze8928", "BinaryOp8930", "Unsqueeze8931", "StridedSlice8934", "Squeeze8935", "BinaryOp8936", "BinaryOp8937", "/Gather_338_output_0", "/Div_66_output_0", "/Unsqueeze_711_output_0", "/Slice_89_output_0", "/Neg_44_output_0", "/Unsqueeze_710_output_0", "/Slice_88_output_0", "/Concat_289_output_0", "/Mul_177_output_0", "/Add_113_output_0", "/FakeLinear_89_output_0", "/Unsqueeze_706_output_0", "/Unsqueeze_707_output_0", "/Concat_287_output_0", "/Reshape_200_output_0", "/k_norm_22/Cast_output_0", "/k_norm_22/Mul_1_output_0", "/Mul_178_output_0", "/Shape_311_output_0", "Shape8819", "Rank8821", "BinaryOp8823", "Unsqueeze8824", "BinaryOp8826", "Unsqueeze8827", "StridedSlice8830", "Squeeze8831", "BinaryOp8832", "BinaryOp8833", "/Gather_339_output_0", "/Div_67_output_0", "/Unsqueeze_713_output_0", "/Slice_91_output_0", "/Neg_45_output_0", "/Unsqueeze_712_output_0", "/Slice_90_output_0", "/Concat_290_output_0", "/Mul_179_output_0", "/Add_114_output_0", "/FakeLinear_90_output_0", "/Unsqueeze_708_output_0", "/Unsqueeze_709_output_0", "/Concat_288_output_0", "/Reshape_201_output_0", "/Reshape_206_output_0", "/FakeLinear_91_output_0", "/Add_116_output_0", "/post_attention_layernorm_22/Mul_1_output_0", "/mlp/gate_proj_22/FakeLinear_output_0", "/mlp/act_fn_22/Mul_output_0", "/mlp/up_proj_22/FakeLinear_output_0", "/mlp_22/Mul_output_0", "/mlp/down_proj_22/FakeLinear_output_0", "/Add_117_output_0", "/Reshape_207_output_0", "/input_layernorm_23/Mul_1_output_0", "/FakeLinear_92_output_0", "/Shape_322_output_0", "Shape9162", "Rank9164", "BinaryOp9166", "Unsqueeze9167", "BinaryOp9169", "Unsqueeze9170", "StridedSlice9173", "Squeeze9174", "BinaryOp9176", "/Gather_351_output_0", "/Unsqueeze_736_output_0", "Unsqueeze9184", "Unsqueeze9187", "StridedSlice9190", "Squeeze9191", "BinaryOp9192", "BinaryOp9193", "/Gather_352_output_0", "/Unsqueeze_737_output_0", "/Concat_299_output_0", "/Reshape_208_output_0", "/q_norm_23/Cast_output_0", "/q_norm_23/Mul_1_output_0", "/Mul_184_output_0", "/Shape_324_output_0", "Shape9312", "Rank9314", "BinaryOp9316", "Unsqueeze9317", "BinaryOp9319", "Unsqueeze9320", "StridedSlice9323", "Squeeze9324", "BinaryOp9325", "BinaryOp9326", "/Gather_353_output_0", "/Div_69_output_0", "/Unsqueeze_743_output_0", "/Slice_93_output_0", "/Neg_46_output_0", "/Unsqueeze_742_output_0", "/Slice_92_output_0", "/Concat_302_output_0", "/Mul_185_output_0", "/Add_118_output_0", "/FakeLinear_93_output_0", "/Unsqueeze_738_output_0", "/Unsqueeze_739_output_0", "/Concat_300_output_0", "/Reshape_209_output_0", "/k_norm_23/Cast_output_0", "/k_norm_23/Mul_1_output_0", "/Mul_186_output_0", "/Shape_325_output_0", "Shape9208", "Rank9210", "BinaryOp9212", "Unsqueeze9213", "BinaryOp9215", "Unsqueeze9216", "StridedSlice9219", "Squeeze9220", "BinaryOp9221", "BinaryOp9222", "/Gather_354_output_0", "/Div_70_output_0", "/Unsqueeze_745_output_0", "/Slice_95_output_0", "/Neg_47_output_0", "/Unsqueeze_744_output_0", "/Slice_94_output_0", "/Concat_303_output_0", "/Mul_187_output_0", "/Add_119_output_0", "/FakeLinear_94_output_0", "/Unsqueeze_740_output_0", "/Unsqueeze_741_output_0", "/Concat_301_output_0", "/Reshape_210_output_0", "/Reshape_215_output_0", "/FakeLinear_95_output_0", "/Add_121_output_0", "/post_attention_layernorm_23/Mul_1_output_0", "/mlp/gate_proj_23/FakeLinear_output_0", "/mlp/act_fn_23/Mul_output_0", "/mlp/up_proj_23/FakeLinear_output_0", "/mlp_23/Mul_output_0", "/mlp/down_proj_23/FakeLinear_output_0", "/Add_122_output_0", "/Reshape_216_output_0", "/input_layernorm_24/Mul_1_output_0", "/FakeLinear_96_output_0", "/Shape_336_output_0", "Shape9551", "Rank9553", "BinaryOp9555", "Unsqueeze9556", "BinaryOp9558", "Unsqueeze9559", "StridedSlice9562", "Squeeze9563", "BinaryOp9565", "/Gather_366_output_0", "/Unsqueeze_768_output_0", "Unsqueeze9573", "Unsqueeze9576", "StridedSlice9579", "Squeeze9580", "BinaryOp9581", "BinaryOp9582", "/Gather_367_output_0", "/Unsqueeze_769_output_0", "/Concat_312_output_0", "/Reshape_217_output_0", "/q_norm_24/Cast_output_0", "/q_norm_24/Mul_1_output_0", "/Mul_192_output_0", "/Shape_338_output_0", "Shape9701", "Rank9703", "BinaryOp9705", "Unsqueeze9706", "BinaryOp9708", "Unsqueeze9709", "StridedSlice9712", "Squeeze9713", "BinaryOp9714", "BinaryOp9715", "/Gather_368_output_0", "/Div_72_output_0", "/Unsqueeze_775_output_0", "/Slice_97_output_0", "/Neg_48_output_0", "/Unsqueeze_774_output_0", "/Slice_96_output_0", "/Concat_315_output_0", "/Mul_193_output_0", "/Add_123_output_0", "/FakeLinear_97_output_0", "/Unsqueeze_770_output_0", "/Unsqueeze_771_output_0", "/Concat_313_output_0", "/Reshape_218_output_0", "/k_norm_24/Cast_output_0", "/k_norm_24/Mul_1_output_0", "/Mul_194_output_0", "/Shape_339_output_0", "Shape9597", "Rank9599", "BinaryOp9601", "Unsqueeze9602", "BinaryOp9604", "Unsqueeze9605", "StridedSlice9608", "Squeeze9609", "BinaryOp9610", "BinaryOp9611", "/Gather_369_output_0", "/Div_73_output_0", "/Unsqueeze_777_output_0", "/Slice_99_output_0", "/Neg_49_output_0", "/Unsqueeze_776_output_0", "/Slice_98_output_0", "/Concat_316_output_0", "/Mul_195_output_0", "/Add_124_output_0", "/FakeLinear_98_output_0", "/Unsqueeze_772_output_0", "/Unsqueeze_773_output_0", "/Concat_314_output_0", "/Reshape_219_output_0", "/Reshape_224_output_0", "/FakeLinear_99_output_0", "/Add_126_output_0", "/post_attention_layernorm_24/Mul_1_output_0", "/mlp/gate_proj_24/FakeLinear_output_0", "/mlp/act_fn_24/Mul_output_0", "/mlp/up_proj_24/FakeLinear_output_0", "/mlp_24/Mul_output_0", "/mlp/down_proj_24/FakeLinear_output_0", "/Add_127_output_0", "/Reshape_225_output_0", "/input_layernorm_25/Mul_1_output_0", "/FakeLinear_100_output_0", "/Shape_350_output_0", "Shape9940", "Rank9942", "BinaryOp9944", "Unsqueeze9945", "BinaryOp9947", "Unsqueeze9948", "StridedSlice9951", "Squeeze9952", "BinaryOp9954", "/Gather_381_output_0", "/Unsqueeze_800_output_0", "Unsqueeze9962", "Unsqueeze9965", "StridedSlice9968", "Squeeze9969", "BinaryOp9970", "BinaryOp9971", "/Gather_382_output_0", "/Unsqueeze_801_output_0", "/Concat_325_output_0", "/Reshape_226_output_0", "/q_norm_25/Cast_output_0", "/q_norm_25/Mul_1_output_0", "/Mul_200_output_0", "/Shape_352_output_0", "Shape10090", "Rank10092", "BinaryOp10094", "Unsqueeze10095", "BinaryOp10097", "Unsqueeze10098", "StridedSlice10101", "Squeeze10102", "BinaryOp10103", "BinaryOp10104", "/Gather_383_output_0", "/Div_75_output_0", "/Unsqueeze_807_output_0", "/Slice_101_output_0", "/Neg_50_output_0", "/Unsqueeze_806_output_0", "/Slice_100_output_0", "/Concat_328_output_0", "/Mul_201_output_0", "/Add_128_output_0", "/FakeLinear_101_output_0", "/Unsqueeze_802_output_0", "/Unsqueeze_803_output_0", "/Concat_326_output_0", "/Reshape_227_output_0", "/k_norm_25/Cast_output_0", "/k_norm_25/Mul_1_output_0", "/Mul_202_output_0", "/Shape_353_output_0", "Shape9986", "Rank9988", "BinaryOp9990", "Unsqueeze9991", "BinaryOp9993", "Unsqueeze9994", "StridedSlice9997", "Squeeze9998", "BinaryOp9999", "BinaryOp10000", "/Gather_384_output_0", "/Div_76_output_0", "/Unsqueeze_809_output_0", "/Slice_103_output_0", "/Neg_51_output_0", "/Unsqueeze_808_output_0", "/Slice_102_output_0", "/Concat_329_output_0", "/Mul_203_output_0", "/Add_129_output_0", "/FakeLinear_102_output_0", "/Unsqueeze_804_output_0", "/Unsqueeze_805_output_0", "/Concat_327_output_0", "/Reshape_228_output_0", "/Reshape_233_output_0", "/FakeLinear_103_output_0", "/Add_131_output_0", "/post_attention_layernorm_25/Mul_1_output_0", "/mlp/gate_proj_25/FakeLinear_output_0", "/mlp/act_fn_25/Mul_output_0", "/mlp/up_proj_25/FakeLinear_output_0", "/mlp_25/Mul_output_0", "/mlp/down_proj_25/FakeLinear_output_0", "/Add_132_output_0", "/Reshape_234_output_0", "/input_layernorm_26/Mul_1_output_0", "/FakeLinear_104_output_0", "/Shape_364_output_0", "Shape10329", "Rank10331", "BinaryOp10333", "Unsqueeze10334", "BinaryOp10336", "Unsqueeze10337", "StridedSlice10340", "Squeeze10341", "BinaryOp10343", "/Gather_396_output_0", "/Unsqueeze_832_output_0", "Unsqueeze10351", "Unsqueeze10354", "StridedSlice10357", "Squeeze10358", "BinaryOp10359", "BinaryOp10360", "/Gather_397_output_0", "/Unsqueeze_833_output_0", "/Concat_338_output_0", "/Reshape_235_output_0", "/q_norm_26/Cast_output_0", "/q_norm_26/Mul_1_output_0", "/Mul_208_output_0", "/Shape_366_output_0", "Shape10479", "Rank10481", "BinaryOp10483", "Unsqueeze10484", "BinaryOp10486", "Unsqueeze10487", "StridedSlice10490", "Squeeze10491", "BinaryOp10492", "BinaryOp10493", "/Gather_398_output_0", "/Div_78_output_0", "/Unsqueeze_839_output_0", "/Slice_105_output_0", "/Neg_52_output_0", "/Unsqueeze_838_output_0", "/Slice_104_output_0", "/Concat_341_output_0", "/Mul_209_output_0", "/Add_133_output_0", "/FakeLinear_105_output_0", "/Unsqueeze_834_output_0", "/Unsqueeze_835_output_0", "/Concat_339_output_0", "/Reshape_236_output_0", "/k_norm_26/Cast_output_0", "/k_norm_26/Mul_1_output_0", "/Mul_210_output_0", "/Shape_367_output_0", "Shape10375", "Rank10377", "BinaryOp10379", "Unsqueeze10380", "BinaryOp10382", "Unsqueeze10383", "StridedSlice10386", "Squeeze10387", "BinaryOp10388", "BinaryOp10389", "/Gather_399_output_0", "/Div_79_output_0", "/Unsqueeze_841_output_0", "/Slice_107_output_0", "/Neg_53_output_0", "/Unsqueeze_840_output_0", "/Slice_106_output_0", "/Concat_342_output_0", "/Mul_211_output_0", "/Add_134_output_0", "/FakeLinear_106_output_0", "/Unsqueeze_836_output_0", "/Unsqueeze_837_output_0", "/Concat_340_output_0", "/Reshape_237_output_0", "/Reshape_242_output_0", "/FakeLinear_107_output_0", "/Add_136_output_0", "/post_attention_layernorm_26/Mul_1_output_0", "/mlp/gate_proj_26/FakeLinear_output_0", "/mlp/act_fn_26/Mul_output_0", "/mlp/up_proj_26/FakeLinear_output_0", "/mlp_26/Mul_output_0", "/mlp/down_proj_26/FakeLinear_output_0", "/Add_137_output_0", "/Reshape_243_output_0", "/input_layernorm_27/Mul_1_output_0", "/FakeLinear_108_output_0", "/Shape_378_output_0", "Shape10718", "Rank10720", "BinaryOp10722", "Unsqueeze10723", "BinaryOp10725", "Unsqueeze10726", "StridedSlice10729", "Squeeze10730", "BinaryOp10732", "/Gather_411_output_0", "/Unsqueeze_864_output_0", "Unsqueeze10740", "Unsqueeze10743", "StridedSlice10746", "Squeeze10747", "BinaryOp10748", "BinaryOp10749", "/Gather_412_output_0", "/Unsqueeze_865_output_0", "/Concat_351_output_0", "/Reshape_244_output_0", "/q_norm_27/Cast_output_0", "/q_norm_27/Mul_1_output_0", "/Mul_216_output_0", "/Shape_380_output_0", "Shape10868", "Rank10870", "BinaryOp10872", "Unsqueeze10873", "BinaryOp10875", "Unsqueeze10876", "StridedSlice10879", "Squeeze10880", "BinaryOp10881", "BinaryOp10882", "/Gather_413_output_0", "/Div_81_output_0", "/Unsqueeze_871_output_0", "/Slice_109_output_0", "/Neg_54_output_0", "/Unsqueeze_870_output_0", "/Slice_108_output_0", "/Concat_354_output_0", "/Mul_217_output_0", "/Add_138_output_0", "/FakeLinear_109_output_0", "/Unsqueeze_866_output_0", "/Unsqueeze_867_output_0", "/Concat_352_output_0", "/Reshape_245_output_0", "/k_norm_27/Cast_output_0", "/k_norm_27/Mul_1_output_0", "/Mul_218_output_0", "/Shape_381_output_0", "Shape10764", "Rank10766", "BinaryOp10768", "Unsqueeze10769", "BinaryOp10771", "Unsqueeze10772", "StridedSlice10775", "Squeeze10776", "BinaryOp10777", "BinaryOp10778", "/Gather_414_output_0", "/Div_82_output_0", "/Unsqueeze_873_output_0", "/Slice_111_output_0", "/Neg_55_output_0", "/Unsqueeze_872_output_0", "/Slice_110_output_0", "/Concat_355_output_0", "/Mul_219_output_0", "/Add_139_output_0", "/FakeLinear_110_output_0", "/Unsqueeze_868_output_0", "/Unsqueeze_869_output_0", "/Concat_353_output_0", "/Reshape_246_output_0", "/Reshape_251_output_0", "/FakeLinear_111_output_0", "/Add_141_output_0", "/post_attention_layernorm_27/Mul_1_output_0", "/mlp/gate_proj_27/FakeLinear_output_0", "/mlp/act_fn_27/Mul_output_0", "/mlp/up_proj_27/FakeLinear_output_0", "/mlp_27/Mul_output_0", "/mlp/down_proj_27/FakeLinear_output_0", "/Add_142_output_0", "/Reshape_252_output_0", "/input_layernorm_28/Mul_1_output_0", "/FakeLinear_112_output_0", "/Shape_392_output_0", "Shape11107", "Rank11109", "BinaryOp11111", "Unsqueeze11112", "BinaryOp11114", "Unsqueeze11115", "StridedSlice11118", "Squeeze11119", "BinaryOp11121", "/Gather_426_output_0", "/Unsqueeze_896_output_0", "Unsqueeze11129", "Unsqueeze11132", "StridedSlice11135", "Squeeze11136", "BinaryOp11137", "BinaryOp11138", "/Gather_427_output_0", "/Unsqueeze_897_output_0", "/Concat_364_output_0", "/Reshape_253_output_0", "/q_norm_28/Cast_output_0", "/q_norm_28/Mul_1_output_0", "/Mul_224_output_0", "/Shape_394_output_0", "Shape11257", "Rank11259", "BinaryOp11261", "Unsqueeze11262", "BinaryOp11264", "Unsqueeze11265", "StridedSlice11268", "Squeeze11269", "BinaryOp11270", "BinaryOp11271", "/Gather_428_output_0", "/Div_84_output_0", "/Unsqueeze_903_output_0", "/Slice_113_output_0", "/Neg_56_output_0", "/Unsqueeze_902_output_0", "/Slice_112_output_0", "/Concat_367_output_0", "/Mul_225_output_0", "/Add_143_output_0", "/FakeLinear_113_output_0", "/Unsqueeze_898_output_0", "/Unsqueeze_899_output_0", "/Concat_365_output_0", "/Reshape_254_output_0", "/k_norm_28/Cast_output_0", "/k_norm_28/Mul_1_output_0", "/Mul_226_output_0", "/Shape_395_output_0", "Shape11153", "Rank11155", "BinaryOp11157", "Unsqueeze11158", "BinaryOp11160", "Unsqueeze11161", "StridedSlice11164", "Squeeze11165", "BinaryOp11166", "BinaryOp11167", "/Gather_429_output_0", "/Div_85_output_0", "/Unsqueeze_905_output_0", "/Slice_115_output_0", "/Neg_57_output_0", "/Unsqueeze_904_output_0", "/Slice_114_output_0", "/Concat_368_output_0", "/Mul_227_output_0", "/Add_144_output_0", "/FakeLinear_114_output_0", "/Unsqueeze_900_output_0", "/Unsqueeze_901_output_0", "/Concat_366_output_0", "/Reshape_255_output_0", "/Reshape_260_output_0", "/FakeLinear_115_output_0", "/Add_146_output_0", "/post_attention_layernorm_28/Mul_1_output_0", "/mlp/gate_proj_28/FakeLinear_output_0", "/mlp/act_fn_28/Mul_output_0", "/mlp/up_proj_28/FakeLinear_output_0", "/mlp_28/Mul_output_0", "/mlp/down_proj_28/FakeLinear_output_0", "/Add_147_output_0", "/Reshape_261_output_0", "/input_layernorm_29/Mul_1_output_0", "/FakeLinear_116_output_0", "/Shape_406_output_0", "Shape11496", "Rank11498", "BinaryOp11500", "Unsqueeze11501", "BinaryOp11503", "Unsqueeze11504", "StridedSlice11507", "Squeeze11508", "BinaryOp11510", "/Gather_441_output_0", "/Unsqueeze_928_output_0", "Unsqueeze11518", "Unsqueeze11521", "StridedSlice11524", "Squeeze11525", "BinaryOp11526", "BinaryOp11527", "/Gather_442_output_0", "/Unsqueeze_929_output_0", "/Concat_377_output_0", "/Reshape_262_output_0", "/q_norm_29/Cast_output_0", "/q_norm_29/Mul_1_output_0", "/Mul_232_output_0", "/Shape_408_output_0", "Shape11646", "Rank11648", "BinaryOp11650", "Unsqueeze11651", "BinaryOp11653", "Unsqueeze11654", "StridedSlice11657", "Squeeze11658", "BinaryOp11659", "BinaryOp11660", "/Gather_443_output_0", "/Div_87_output_0", "/Unsqueeze_935_output_0", "/Slice_117_output_0", "/Neg_58_output_0", "/Unsqueeze_934_output_0", "/Slice_116_output_0", "/Concat_380_output_0", "/Mul_233_output_0", "/Add_148_output_0", "/FakeLinear_117_output_0", "/Unsqueeze_930_output_0", "/Unsqueeze_931_output_0", "/Concat_378_output_0", "/Reshape_263_output_0", "/k_norm_29/Cast_output_0", "/k_norm_29/Mul_1_output_0", "/Mul_234_output_0", "/Shape_409_output_0", "Shape11542", "Rank11544", "BinaryOp11546", "Unsqueeze11547", "BinaryOp11549", "Unsqueeze11550", "StridedSlice11553", "Squeeze11554", "BinaryOp11555", "BinaryOp11556", "/Gather_444_output_0", "/Div_88_output_0", "/Unsqueeze_937_output_0", "/Slice_119_output_0", "/Neg_59_output_0", "/Unsqueeze_936_output_0", "/Slice_118_output_0", "/Concat_381_output_0", "/Mul_235_output_0", "/Add_149_output_0", "/FakeLinear_118_output_0", "/Unsqueeze_932_output_0", "/Unsqueeze_933_output_0", "/Concat_379_output_0", "/Reshape_264_output_0", "/Reshape_269_output_0", "/FakeLinear_119_output_0", "/Add_151_output_0", "/post_attention_layernorm_29/Mul_1_output_0", "/mlp/gate_proj_29/FakeLinear_output_0", "/mlp/act_fn_29/Mul_output_0", "/mlp/up_proj_29/FakeLinear_output_0", "/mlp_29/Mul_output_0", "/mlp/down_proj_29/FakeLinear_output_0", "/Add_152_output_0", "/Reshape_270_output_0", "/input_layernorm_30/Mul_1_output_0", "/FakeLinear_120_output_0", "/Shape_420_output_0", "Shape11885", "Rank11887", "BinaryOp11889", "Unsqueeze11890", "BinaryOp11892", "Unsqueeze11893", "StridedSlice11896", "Squeeze11897", "BinaryOp11899", "/Gather_456_output_0", "/Unsqueeze_960_output_0", "Unsqueeze11907", "Unsqueeze11910", "StridedSlice11913", "Squeeze11914", "BinaryOp11915", "BinaryOp11916", "/Gather_457_output_0", "/Unsqueeze_961_output_0", "/Concat_390_output_0", "/Reshape_271_output_0", "/q_norm_30/Cast_output_0", "/q_norm_30/Mul_1_output_0", "/Mul_240_output_0", "/Shape_422_output_0", "Shape12035", "Rank12037", "BinaryOp12039", "Unsqueeze12040", "BinaryOp12042", "Unsqueeze12043", "StridedSlice12046", "Squeeze12047", "BinaryOp12048", "BinaryOp12049", "/Gather_458_output_0", "/Div_90_output_0", "/Unsqueeze_967_output_0", "/Slice_121_output_0", "/Neg_60_output_0", "/Unsqueeze_966_output_0", "/Slice_120_output_0", "/Concat_393_output_0", "/Mul_241_output_0", "/Add_153_output_0", "/FakeLinear_121_output_0", "/Unsqueeze_962_output_0", "/Unsqueeze_963_output_0", "/Concat_391_output_0", "/Reshape_272_output_0", "/k_norm_30/Cast_output_0", "/k_norm_30/Mul_1_output_0", "/Mul_242_output_0", "/Shape_423_output_0", "Shape11931", "Rank11933", "BinaryOp11935", "Unsqueeze11936", "BinaryOp11938", "Unsqueeze11939", "StridedSlice11942", "Squeeze11943", "BinaryOp11944", "BinaryOp11945", "/Gather_459_output_0", "/Div_91_output_0", "/Unsqueeze_969_output_0", "/Slice_123_output_0", "/Neg_61_output_0", "/Unsqueeze_968_output_0", "/Slice_122_output_0", "/Concat_394_output_0", "/Mul_243_output_0", "/Add_154_output_0", "/FakeLinear_122_output_0", "/Unsqueeze_964_output_0", "/Unsqueeze_965_output_0", "/Concat_392_output_0", "/Reshape_273_output_0", "/Reshape_278_output_0", "/FakeLinear_123_output_0", "/Add_156_output_0", "/post_attention_layernorm_30/Mul_1_output_0", "/mlp/gate_proj_30/FakeLinear_output_0", "/mlp/act_fn_30/Mul_output_0", "/mlp/up_proj_30/FakeLinear_output_0", "/mlp_30/Mul_output_0", "/mlp/down_proj_30/FakeLinear_output_0", "/Add_157_output_0", "/Reshape_279_output_0", "/input_layernorm_31/Mul_1_output_0", "/FakeLinear_124_output_0", "/Shape_434_output_0", "Shape12274", "Rank12276", "BinaryOp12278", "Unsqueeze12279", "BinaryOp12281", "Unsqueeze12282", "StridedSlice12285", "Squeeze12286", "BinaryOp12288", "/Gather_471_output_0", "/Unsqueeze_992_output_0", "Unsqueeze12296", "Unsqueeze12299", "StridedSlice12302", "Squeeze12303", "BinaryOp12304", "BinaryOp12305", "/Gather_472_output_0", "/Unsqueeze_993_output_0", "/Concat_403_output_0", "/Reshape_280_output_0", "/q_norm_31/Cast_output_0", "/q_norm_31/Mul_1_output_0", "/Mul_248_output_0", "/Shape_436_output_0", "Shape12424", "Rank12426", "BinaryOp12428", "Unsqueeze12429", "BinaryOp12431", "Unsqueeze12432", "StridedSlice12435", "Squeeze12436", "BinaryOp12437", "BinaryOp12438", "/Gather_473_output_0", "/Div_93_output_0", "/Unsqueeze_999_output_0", "/Slice_125_output_0", "/Neg_62_output_0", "/Unsqueeze_998_output_0", "/Slice_124_output_0", "/Concat_406_output_0", "/Mul_249_output_0", "/Add_158_output_0", "/FakeLinear_125_output_0", "/Unsqueeze_994_output_0", "/Unsqueeze_995_output_0", "/Concat_404_output_0", "/Reshape_281_output_0", "/k_norm_31/Cast_output_0", "/k_norm_31/Mul_1_output_0", "/Mul_250_output_0", "/Shape_437_output_0", "Shape12320", "Rank12322", "BinaryOp12324", "Unsqueeze12325", "BinaryOp12327", "Unsqueeze12328", "StridedSlice12331", "Squeeze12332", "BinaryOp12333", "BinaryOp12334", "/Gather_474_output_0", "/Div_94_output_0", "/Unsqueeze_1001_output_0", "/Slice_127_output_0", "/Neg_63_output_0", "/Unsqueeze_1000_output_0", "/Slice_126_output_0", "/Concat_407_output_0", "/Mul_251_output_0", "/Add_159_output_0", "/FakeLinear_126_output_0", "/Unsqueeze_996_output_0", "/Unsqueeze_997_output_0", "/Concat_405_output_0", "/Reshape_282_output_0", "/Reshape_287_output_0", "/FakeLinear_127_output_0", "/Add_161_output_0", "/post_attention_layernorm_31/Mul_1_output_0", "/mlp/gate_proj_31/FakeLinear_output_0", "/mlp/act_fn_31/Mul_output_0", "/mlp/up_proj_31/FakeLinear_output_0", "/mlp_31/Mul_output_0", "/mlp/down_proj_31/FakeLinear_output_0", "/Add_162_output_0", "/Reshape_288_output_0", "/input_layernorm_32/Mul_1_output_0", "/FakeLinear_128_output_0", "/Shape_448_output_0", "Shape12663", "Rank12665", "BinaryOp12667", "Unsqueeze12668", "BinaryOp12670", "Unsqueeze12671", "StridedSlice12674", "Squeeze12675", "BinaryOp12677", "/Gather_486_output_0", "/Unsqueeze_1024_output_0", "Unsqueeze12685", "Unsqueeze12688", "StridedSlice12691", "Squeeze12692", "BinaryOp12693", "BinaryOp12694", "/Gather_487_output_0", "/Unsqueeze_1025_output_0", "/Concat_416_output_0", "/Reshape_289_output_0", "/q_norm_32/Cast_output_0", "/q_norm_32/Mul_1_output_0", "/Mul_256_output_0", "/Shape_450_output_0", "Shape12813", "Rank12815", "BinaryOp12817", "Unsqueeze12818", "BinaryOp12820", "Unsqueeze12821", "StridedSlice12824", "Squeeze12825", "BinaryOp12826", "BinaryOp12827", "/Gather_488_output_0", "/Div_96_output_0", "/Unsqueeze_1031_output_0", "/Slice_129_output_0", "/Neg_64_output_0", "/Unsqueeze_1030_output_0", "/Slice_128_output_0", "/Concat_419_output_0", "/Mul_257_output_0", "/Add_163_output_0", "/FakeLinear_129_output_0", "/Unsqueeze_1026_output_0", "/Unsqueeze_1027_output_0", "/Concat_417_output_0", "/Reshape_290_output_0", "/k_norm_32/Cast_output_0", "/k_norm_32/Mul_1_output_0", "/Mul_258_output_0", "/Shape_451_output_0", "Shape12709", "Rank12711", "BinaryOp12713", "Unsqueeze12714", "BinaryOp12716", "Unsqueeze12717", "StridedSlice12720", "Squeeze12721", "BinaryOp12722", "BinaryOp12723", "/Gather_489_output_0", "/Div_97_output_0", "/Unsqueeze_1033_output_0", "/Slice_131_output_0", "/Neg_65_output_0", "/Unsqueeze_1032_output_0", "/Slice_130_output_0", "/Concat_420_output_0", "/Mul_259_output_0", "/Add_164_output_0", "/FakeLinear_130_output_0", "/Unsqueeze_1028_output_0", "/Unsqueeze_1029_output_0", "/Concat_418_output_0", "/Reshape_291_output_0", "/Reshape_296_output_0", "/FakeLinear_131_output_0", "/Add_166_output_0", "/post_attention_layernorm_32/Mul_1_output_0", "/mlp/gate_proj_32/FakeLinear_output_0", "/mlp/act_fn_32/Mul_output_0", "/mlp/up_proj_32/FakeLinear_output_0", "/mlp_32/Mul_output_0", "/mlp/down_proj_32/FakeLinear_output_0", "/Add_167_output_0", "/Reshape_297_output_0", "/input_layernorm_33/Mul_1_output_0", "/FakeLinear_132_output_0", "/Shape_462_output_0", "Shape13052", "Rank13054", "BinaryOp13056", "Unsqueeze13057", "BinaryOp13059", "Unsqueeze13060", "StridedSlice13063", "Squeeze13064", "BinaryOp13066", "/Gather_501_output_0", "/Unsqueeze_1056_output_0", "Unsqueeze13074", "Unsqueeze13077", "StridedSlice13080", "Squeeze13081", "BinaryOp13082", "BinaryOp13083", "/Gather_502_output_0", "/Unsqueeze_1057_output_0", "/Concat_429_output_0", "/Reshape_298_output_0", "/q_norm_33/Cast_output_0", "/q_norm_33/Mul_1_output_0", "/Mul_264_output_0", "/Shape_464_output_0", "Shape13202", "Rank13204", "BinaryOp13206", "Unsqueeze13207", "BinaryOp13209", "Unsqueeze13210", "StridedSlice13213", "Squeeze13214", "BinaryOp13215", "BinaryOp13216", "/Gather_503_output_0", "/Div_99_output_0", "/Unsqueeze_1063_output_0", "/Slice_133_output_0", "/Neg_66_output_0", "/Unsqueeze_1062_output_0", "/Slice_132_output_0", "/Concat_432_output_0", "/Mul_265_output_0", "/Add_168_output_0", "/FakeLinear_133_output_0", "/Unsqueeze_1058_output_0", "/Unsqueeze_1059_output_0", "/Concat_430_output_0", "/Reshape_299_output_0", "/k_norm_33/Cast_output_0", "/k_norm_33/Mul_1_output_0", "/Mul_266_output_0", "/Shape_465_output_0", "Shape13098", "Rank13100", "BinaryOp13102", "Unsqueeze13103", "BinaryOp13105", "Unsqueeze13106", "StridedSlice13109", "Squeeze13110", "BinaryOp13111", "BinaryOp13112", "/Gather_504_output_0", "/Div_100_output_0", "/Unsqueeze_1065_output_0", "/Slice_135_output_0", "/Neg_67_output_0", "/Unsqueeze_1064_output_0", "/Slice_134_output_0", "/Concat_433_output_0", "/Mul_267_output_0", "/Add_169_output_0", "/FakeLinear_134_output_0", "/Unsqueeze_1060_output_0", "/Unsqueeze_1061_output_0", "/Concat_431_output_0", "/Reshape_300_output_0", "/Reshape_305_output_0", "/FakeLinear_135_output_0", "/Add_171_output_0", "/post_attention_layernorm_33/Mul_1_output_0", "/mlp/gate_proj_33/FakeLinear_output_0", "/mlp/act_fn_33/Mul_output_0", "/mlp/up_proj_33/FakeLinear_output_0", "/mlp_33/Mul_output_0", "/mlp/down_proj_33/FakeLinear_output_0", "/Add_172_output_0", "/Reshape_306_output_0", "/input_layernorm_34/Mul_1_output_0", "/FakeLinear_136_output_0", "/Shape_476_output_0", "Shape13441", "Rank13443", "BinaryOp13445", "Unsqueeze13446", "BinaryOp13448", "Unsqueeze13449", "StridedSlice13452", "Squeeze13453", "BinaryOp13455", "/Gather_516_output_0", "/Unsqueeze_1088_output_0", "Unsqueeze13463", "Unsqueeze13466", "StridedSlice13469", "Squeeze13470", "BinaryOp13471", "BinaryOp13472", "/Gather_517_output_0", "/Unsqueeze_1089_output_0", "/Concat_442_output_0", "/Reshape_307_output_0", "/q_norm_34/Cast_output_0", "/q_norm_34/Mul_1_output_0", "/Mul_272_output_0", "/Shape_478_output_0", "Shape13591", "Rank13593", "BinaryOp13595", "Unsqueeze13596", "BinaryOp13598", "Unsqueeze13599", "StridedSlice13602", "Squeeze13603", "BinaryOp13604", "BinaryOp13605", "/Gather_518_output_0", "/Div_102_output_0", "/Unsqueeze_1095_output_0", "/Slice_137_output_0", "/Neg_68_output_0", "/Unsqueeze_1094_output_0", "/Slice_136_output_0", "/Concat_445_output_0", "/Mul_273_output_0", "/Add_173_output_0", "/FakeLinear_137_output_0", "/Unsqueeze_1090_output_0", "/Unsqueeze_1091_output_0", "/Concat_443_output_0", "/Reshape_308_output_0", "/k_norm_34/Cast_output_0", "/k_norm_34/Mul_1_output_0", "/Mul_274_output_0", "/Shape_479_output_0", "Shape13487", "Rank13489", "BinaryOp13491", "Unsqueeze13492", "BinaryOp13494", "Unsqueeze13495", "StridedSlice13498", "Squeeze13499", "BinaryOp13500", "BinaryOp13501", "/Gather_519_output_0", "/Div_103_output_0", "/Unsqueeze_1097_output_0", "/Slice_139_output_0", "/Neg_69_output_0", "/Unsqueeze_1096_output_0", "/Slice_138_output_0", "/Concat_446_output_0", "/Mul_275_output_0", "/Add_174_output_0", "/FakeLinear_138_output_0", "/Unsqueeze_1092_output_0", "/Unsqueeze_1093_output_0", "/Concat_444_output_0", "/Reshape_309_output_0", "/Reshape_314_output_0", "/FakeLinear_139_output_0", "/Add_176_output_0", "/post_attention_layernorm_34/Mul_1_output_0", "/mlp/gate_proj_34/FakeLinear_output_0", "/mlp/act_fn_34/Mul_output_0", "/mlp/up_proj_34/FakeLinear_output_0", "/mlp_34/Mul_output_0", "/mlp/down_proj_34/FakeLinear_output_0", "/Add_177_output_0", "/Reshape_315_output_0", "/input_layernorm_35/Mul_1_output_0", "/FakeLinear_140_output_0", "/Shape_490_output_0", "Shape13830", "Rank13832", "BinaryOp13834", "Unsqueeze13835", "BinaryOp13837", "Unsqueeze13838", "StridedSlice13841", "Squeeze13842", "BinaryOp13844", "/Gather_531_output_0", "/Unsqueeze_1120_output_0", "Unsqueeze13852", "Unsqueeze13855", "StridedSlice13858", "Squeeze13859", "BinaryOp13860", "BinaryOp13861", "/Gather_532_output_0", "/Unsqueeze_1121_output_0", "/Concat_455_output_0", "/Reshape_316_output_0", "/q_norm_35/Cast_output_0", "/q_norm_35/Mul_1_output_0", "/Mul_280_output_0", "/Shape_492_output_0", "Shape13948", "Rank13950", "BinaryOp13952", "Unsqueeze13953", "BinaryOp13955", "Unsqueeze13956", "StridedSlice13959", "Squeeze13960", "BinaryOp13961", "BinaryOp13962", "/Gather_533_output_0", "/Div_105_output_0", "/Unsqueeze_1127_output_0", "/Slice_141_output_0", "/Neg_70_output_0", "/Unsqueeze_1126_output_0", "/Slice_140_output_0", "/Concat_458_output_0", "/Mul_281_output_0", "/Add_178_output_0", "/FakeLinear_141_output_0", "/Unsqueeze_1122_output_0", "/Unsqueeze_1123_output_0", "/Concat_456_output_0", "/Reshape_317_output_0", "/k_norm_35/Cast_output_0", "/k_norm_35/Mul_1_output_0", "/Mul_282_output_0", "/Shape_493_output_0", "Shape13876", "Rank13878", "BinaryOp13880", "Unsqueeze13881", "BinaryOp13883", "Unsqueeze13884", "StridedSlice13887", "Squeeze13888", "BinaryOp13889", "BinaryOp13890", "/Gather_534_output_0", "/Div_106_output_0", "/Unsqueeze_1129_output_0", "/Slice_143_output_0", "/Neg_71_output_0", "/Unsqueeze_1128_output_0", "/Slice_142_output_0", "/Concat_459_output_0", "/Mul_283_output_0", "/Add_179_output_0", "/FakeLinear_142_output_0", "/Unsqueeze_1124_output_0", "/Unsqueeze_1125_output_0", "/Concat_457_output_0", "/Reshape_318_output_0", "/Reshape_323_output_0", "/FakeLinear_143_output_0", "/Add_181_output_0", "/post_attention_layernorm_35/Mul_1_output_0", "/mlp/gate_proj_35/FakeLinear_output_0", "/mlp/act_fn_35/Mul_output_0", "/mlp/up_proj_35/FakeLinear_output_0", "/mlp_35/Mul_output_0", "/mlp/down_proj_35/FakeLinear_output_0", "/Add_182_output_0", "/Slice_144_output_0", "hidden_states", "logits", "/layers.0/self_attn/q_proj/Linear/pre_reshape", "/layers.0/self_attn/q_proj/Linear/pre_convert", "/layers.0/self_attn/q_proj/Linear", "/layers.0/self_attn/q_proj/Linear/post_convert", "/layers.0/self_attn/k_proj/Linear/pre_reshape", "/layers.0/self_attn/k_proj/Linear/pre_convert", "/layers.0/self_attn/k_proj/Linear", "/layers.0/self_attn/k_proj/Linear/post_convert", "/layers.0/self_attn/v_proj/Linear/pre_reshape", "/layers.0/self_attn/v_proj/Linear/pre_convert", "/layers.0/self_attn/v_proj/Linear", "/layers.0/self_attn/v_proj/Linear/post_convert", "/layers.0/self_attn/o_proj/Linear/pre_reshape", "/layers.0/self_attn/o_proj/Linear/pre_convert", "/layers.0/self_attn/o_proj/Linear", "/layers.0/self_attn/o_proj/Linear/post_convert", "/layers.0/mlp/gate_proj/Linear/pre_reshape", "/layers.0/mlp/gate_proj/Linear/pre_convert", "/layers.0/mlp/gate_proj/Linear", "/layers.0/mlp/gate_proj/Linear/post_convert", "/layers.0/mlp/up_proj/Linear/pre_reshape", "/layers.0/mlp/up_proj/Linear/pre_convert", "/layers.0/mlp/up_proj/Linear", "/layers.0/mlp/up_proj/Linear/post_convert", "/layers.0/mlp/down_proj/Linear/pre_reshape", "/layers.0/mlp/down_proj/Linear/pre_convert", "/layers.0/mlp/down_proj/Linear", "/layers.0/mlp/down_proj/Linear/post_convert", "/layers.1/self_attn/q_proj/Linear/pre_reshape", "/layers.1/self_attn/q_proj/Linear/pre_convert", "/layers.1/self_attn/q_proj/Linear", "/layers.1/self_attn/q_proj/Linear/post_convert", "/layers.1/self_attn/k_proj/Linear/pre_reshape", "/layers.1/self_attn/k_proj/Linear/pre_convert", "/layers.1/self_attn/k_proj/Linear", "/layers.1/self_attn/k_proj/Linear/post_convert", "/layers.1/self_attn/v_proj/Linear/pre_reshape", "/layers.1/self_attn/v_proj/Linear/pre_convert", "/layers.1/self_attn/v_proj/Linear", "/layers.1/self_attn/v_proj/Linear/post_convert", "/layers.1/self_attn/o_proj/Linear/pre_reshape", "/layers.1/self_attn/o_proj/Linear/pre_convert", "/layers.1/self_attn/o_proj/Linear", "/layers.1/self_attn/o_proj/Linear/post_convert", "/layers.1/mlp/gate_proj/Linear/pre_reshape", "/layers.1/mlp/gate_proj/Linear/pre_convert", "/layers.1/mlp/gate_proj/Linear", "/layers.1/mlp/gate_proj/Linear/post_convert", "/layers.1/mlp/up_proj/Linear/pre_reshape", "/layers.1/mlp/up_proj/Linear/pre_convert", "/layers.1/mlp/up_proj/Linear", "/layers.1/mlp/up_proj/Linear/post_convert", "/layers.1/mlp/down_proj/Linear/pre_reshape", "/layers.1/mlp/down_proj/Linear/pre_convert", "/layers.1/mlp/down_proj/Linear", "/layers.1/mlp/down_proj/Linear/post_convert", "/layers.2/self_attn/q_proj/Linear/pre_reshape", "/layers.2/self_attn/q_proj/Linear/pre_convert", "/layers.2/self_attn/q_proj/Linear", "/layers.2/self_attn/q_proj/Linear/post_convert", "/layers.2/self_attn/k_proj/Linear/pre_reshape", "/layers.2/self_attn/k_proj/Linear/pre_convert", "/layers.2/self_attn/k_proj/Linear", "/layers.2/self_attn/k_proj/Linear/post_convert", "/layers.2/self_attn/v_proj/Linear/pre_reshape", "/layers.2/self_attn/v_proj/Linear/pre_convert", "/layers.2/self_attn/v_proj/Linear", "/layers.2/self_attn/v_proj/Linear/post_convert", "/layers.2/self_attn/o_proj/Linear/pre_reshape", "/layers.2/self_attn/o_proj/Linear/pre_convert", "/layers.2/self_attn/o_proj/Linear", "/layers.2/self_attn/o_proj/Linear/post_convert", "/layers.2/mlp/gate_proj/Linear/pre_reshape", "/layers.2/mlp/gate_proj/Linear/pre_convert", "/layers.2/mlp/gate_proj/Linear", "/layers.2/mlp/gate_proj/Linear/post_convert", "/layers.2/mlp/up_proj/Linear/pre_reshape", "/layers.2/mlp/up_proj/Linear/pre_convert", "/layers.2/mlp/up_proj/Linear", "/layers.2/mlp/up_proj/Linear/post_convert", "/layers.2/mlp/down_proj/Linear/pre_reshape", "/layers.2/mlp/down_proj/Linear/pre_convert", "/layers.2/mlp/down_proj/Linear", "/layers.2/mlp/down_proj/Linear/post_convert", "/layers.3/self_attn/q_proj/Linear/pre_reshape", "/layers.3/self_attn/q_proj/Linear/pre_convert", "/layers.3/self_attn/q_proj/Linear", "/layers.3/self_attn/q_proj/Linear/post_convert", "/layers.3/self_attn/k_proj/Linear/pre_reshape", "/layers.3/self_attn/k_proj/Linear/pre_convert", "/layers.3/self_attn/k_proj/Linear", "/layers.3/self_attn/k_proj/Linear/post_convert", "/layers.3/self_attn/v_proj/Linear/pre_reshape", "/layers.3/self_attn/v_proj/Linear/pre_convert", "/layers.3/self_attn/v_proj/Linear", "/layers.3/self_attn/v_proj/Linear/post_convert", "/layers.3/self_attn/o_proj/Linear/pre_reshape", "/layers.3/self_attn/o_proj/Linear/pre_convert", "/layers.3/self_attn/o_proj/Linear", "/layers.3/self_attn/o_proj/Linear/post_convert", "/layers.3/mlp/gate_proj/Linear/pre_reshape", "/layers.3/mlp/gate_proj/Linear/pre_convert", "/layers.3/mlp/gate_proj/Linear", "/layers.3/mlp/gate_proj/Linear/post_convert", "/layers.3/mlp/up_proj/Linear/pre_reshape", "/layers.3/mlp/up_proj/Linear/pre_convert", "/layers.3/mlp/up_proj/Linear", "/layers.3/mlp/up_proj/Linear/post_convert", "/layers.3/mlp/down_proj/Linear/pre_reshape", "/layers.3/mlp/down_proj/Linear/pre_convert", "/layers.3/mlp/down_proj/Linear", "/layers.3/mlp/down_proj/Linear/post_convert", "/layers.4/self_attn/q_proj/Linear/pre_reshape", "/layers.4/self_attn/q_proj/Linear/pre_convert", "/layers.4/self_attn/q_proj/Linear", "/layers.4/self_attn/q_proj/Linear/post_convert", "/layers.4/self_attn/k_proj/Linear/pre_reshape", "/layers.4/self_attn/k_proj/Linear/pre_convert", "/layers.4/self_attn/k_proj/Linear", "/layers.4/self_attn/k_proj/Linear/post_convert", "/layers.4/self_attn/v_proj/Linear/pre_reshape", "/layers.4/self_attn/v_proj/Linear/pre_convert", "/layers.4/self_attn/v_proj/Linear", "/layers.4/self_attn/v_proj/Linear/post_convert", "/layers.4/self_attn/o_proj/Linear/pre_reshape", "/layers.4/self_attn/o_proj/Linear/pre_convert", "/layers.4/self_attn/o_proj/Linear", "/layers.4/self_attn/o_proj/Linear/post_convert", "/layers.4/mlp/gate_proj/Linear/pre_reshape", "/layers.4/mlp/gate_proj/Linear/pre_convert", "/layers.4/mlp/gate_proj/Linear", "/layers.4/mlp/gate_proj/Linear/post_convert", "/layers.4/mlp/up_proj/Linear/pre_reshape", "/layers.4/mlp/up_proj/Linear/pre_convert", "/layers.4/mlp/up_proj/Linear", "/layers.4/mlp/up_proj/Linear/post_convert", "/layers.4/mlp/down_proj/Linear/pre_reshape", "/layers.4/mlp/down_proj/Linear/pre_convert", "/layers.4/mlp/down_proj/Linear", "/layers.4/mlp/down_proj/Linear/post_convert", "/layers.5/self_attn/q_proj/Linear/pre_reshape", "/layers.5/self_attn/q_proj/Linear/pre_convert", "/layers.5/self_attn/q_proj/Linear", "/layers.5/self_attn/q_proj/Linear/post_convert", "/layers.5/self_attn/k_proj/Linear/pre_reshape", "/layers.5/self_attn/k_proj/Linear/pre_convert", "/layers.5/self_attn/k_proj/Linear", "/layers.5/self_attn/k_proj/Linear/post_convert", "/layers.5/self_attn/v_proj/Linear/pre_reshape", "/layers.5/self_attn/v_proj/Linear/pre_convert", "/layers.5/self_attn/v_proj/Linear", "/layers.5/self_attn/v_proj/Linear/post_convert", "/layers.5/self_attn/o_proj/Linear/pre_reshape", "/layers.5/self_attn/o_proj/Linear/pre_convert", "/layers.5/self_attn/o_proj/Linear", "/layers.5/self_attn/o_proj/Linear/post_convert", "/layers.5/mlp/gate_proj/Linear/pre_reshape", "/layers.5/mlp/gate_proj/Linear/pre_convert", "/layers.5/mlp/gate_proj/Linear", "/layers.5/mlp/gate_proj/Linear/post_convert", "/layers.5/mlp/up_proj/Linear/pre_reshape", "/layers.5/mlp/up_proj/Linear/pre_convert", "/layers.5/mlp/up_proj/Linear", "/layers.5/mlp/up_proj/Linear/post_convert", "/layers.5/mlp/down_proj/Linear/pre_reshape", "/layers.5/mlp/down_proj/Linear/pre_convert", "/layers.5/mlp/down_proj/Linear", "/layers.5/mlp/down_proj/Linear/post_convert", "/layers.6/self_attn/q_proj/Linear/pre_reshape", "/layers.6/self_attn/q_proj/Linear/pre_convert", "/layers.6/self_attn/q_proj/Linear", "/layers.6/self_attn/q_proj/Linear/post_convert", "/layers.6/self_attn/k_proj/Linear/pre_reshape", "/layers.6/self_attn/k_proj/Linear/pre_convert", "/layers.6/self_attn/k_proj/Linear", "/layers.6/self_attn/k_proj/Linear/post_convert", "/layers.6/self_attn/v_proj/Linear/pre_reshape", "/layers.6/self_attn/v_proj/Linear/pre_convert", "/layers.6/self_attn/v_proj/Linear", "/layers.6/self_attn/v_proj/Linear/post_convert", "/layers.6/self_attn/o_proj/Linear/pre_reshape", "/layers.6/self_attn/o_proj/Linear/pre_convert", "/layers.6/self_attn/o_proj/Linear", "/layers.6/self_attn/o_proj/Linear/post_convert", "/layers.6/mlp/gate_proj/Linear/pre_reshape", "/layers.6/mlp/gate_proj/Linear/pre_convert", "/layers.6/mlp/gate_proj/Linear", "/layers.6/mlp/gate_proj/Linear/post_convert", "/layers.6/mlp/up_proj/Linear/pre_reshape", "/layers.6/mlp/up_proj/Linear/pre_convert", "/layers.6/mlp/up_proj/Linear", "/layers.6/mlp/up_proj/Linear/post_convert", "/layers.6/mlp/down_proj/Linear/pre_reshape", "/layers.6/mlp/down_proj/Linear/pre_convert", "/layers.6/mlp/down_proj/Linear", "/layers.6/mlp/down_proj/Linear/post_convert", "/layers.7/self_attn/q_proj/Linear/pre_reshape", "/layers.7/self_attn/q_proj/Linear/pre_convert", "/layers.7/self_attn/q_proj/Linear", "/layers.7/self_attn/q_proj/Linear/post_convert", "/layers.7/self_attn/k_proj/Linear/pre_reshape", "/layers.7/self_attn/k_proj/Linear/pre_convert", "/layers.7/self_attn/k_proj/Linear", "/layers.7/self_attn/k_proj/Linear/post_convert", "/layers.7/self_attn/v_proj/Linear/pre_reshape", "/layers.7/self_attn/v_proj/Linear/pre_convert", "/layers.7/self_attn/v_proj/Linear", "/layers.7/self_attn/v_proj/Linear/post_convert", "/layers.7/self_attn/o_proj/Linear/pre_reshape", "/layers.7/self_attn/o_proj/Linear/pre_convert", "/layers.7/self_attn/o_proj/Linear", "/layers.7/self_attn/o_proj/Linear/post_convert", "/layers.7/mlp/gate_proj/Linear/pre_reshape", "/layers.7/mlp/gate_proj/Linear/pre_convert", "/layers.7/mlp/gate_proj/Linear", "/layers.7/mlp/gate_proj/Linear/post_convert", "/layers.7/mlp/up_proj/Linear/pre_reshape", "/layers.7/mlp/up_proj/Linear/pre_convert", "/layers.7/mlp/up_proj/Linear", "/layers.7/mlp/up_proj/Linear/post_convert", "/layers.7/mlp/down_proj/Linear/pre_reshape", "/layers.7/mlp/down_proj/Linear/pre_convert", "/layers.7/mlp/down_proj/Linear", "/layers.7/mlp/down_proj/Linear/post_convert", "/layers.8/self_attn/q_proj/Linear/pre_reshape", "/layers.8/self_attn/q_proj/Linear/pre_convert", "/layers.8/self_attn/q_proj/Linear", "/layers.8/self_attn/q_proj/Linear/post_convert", "/layers.8/self_attn/k_proj/Linear/pre_reshape", "/layers.8/self_attn/k_proj/Linear/pre_convert", "/layers.8/self_attn/k_proj/Linear", "/layers.8/self_attn/k_proj/Linear/post_convert", "/layers.8/self_attn/v_proj/Linear/pre_reshape", "/layers.8/self_attn/v_proj/Linear/pre_convert", "/layers.8/self_attn/v_proj/Linear", "/layers.8/self_attn/v_proj/Linear/post_convert", "/layers.8/self_attn/o_proj/Linear/pre_reshape", "/layers.8/self_attn/o_proj/Linear/pre_convert", "/layers.8/self_attn/o_proj/Linear", "/layers.8/self_attn/o_proj/Linear/post_convert", "/layers.8/mlp/gate_proj/Linear/pre_reshape", "/layers.8/mlp/gate_proj/Linear/pre_convert", "/layers.8/mlp/gate_proj/Linear", "/layers.8/mlp/gate_proj/Linear/post_convert", "/layers.8/mlp/up_proj/Linear/pre_reshape", "/layers.8/mlp/up_proj/Linear/pre_convert", "/layers.8/mlp/up_proj/Linear", "/layers.8/mlp/up_proj/Linear/post_convert", "/layers.8/mlp/down_proj/Linear/pre_reshape", "/layers.8/mlp/down_proj/Linear/pre_convert", "/layers.8/mlp/down_proj/Linear", "/layers.8/mlp/down_proj/Linear/post_convert", "/layers.9/self_attn/q_proj/Linear/pre_reshape", "/layers.9/self_attn/q_proj/Linear/pre_convert", "/layers.9/self_attn/q_proj/Linear", "/layers.9/self_attn/q_proj/Linear/post_convert", "/layers.9/self_attn/k_proj/Linear/pre_reshape", "/layers.9/self_attn/k_proj/Linear/pre_convert", "/layers.9/self_attn/k_proj/Linear", "/layers.9/self_attn/k_proj/Linear/post_convert", "/layers.9/self_attn/v_proj/Linear/pre_reshape", "/layers.9/self_attn/v_proj/Linear/pre_convert", "/layers.9/self_attn/v_proj/Linear", "/layers.9/self_attn/v_proj/Linear/post_convert", "/layers.9/self_attn/o_proj/Linear/pre_reshape", "/layers.9/self_attn/o_proj/Linear/pre_convert", "/layers.9/self_attn/o_proj/Linear", "/layers.9/self_attn/o_proj/Linear/post_convert", "/layers.9/mlp/gate_proj/Linear/pre_reshape", "/layers.9/mlp/gate_proj/Linear/pre_convert", "/layers.9/mlp/gate_proj/Linear", "/layers.9/mlp/gate_proj/Linear/post_convert", "/layers.9/mlp/up_proj/Linear/pre_reshape", "/layers.9/mlp/up_proj/Linear/pre_convert", "/layers.9/mlp/up_proj/Linear", "/layers.9/mlp/up_proj/Linear/post_convert", "/layers.9/mlp/down_proj/Linear/pre_reshape", "/layers.9/mlp/down_proj/Linear/pre_convert", "/layers.9/mlp/down_proj/Linear", "/layers.9/mlp/down_proj/Linear/post_convert", "/layers.10/self_attn/q_proj/Linear/pre_reshape", "/layers.10/self_attn/q_proj/Linear/pre_convert", "/layers.10/self_attn/q_proj/Linear", "/layers.10/self_attn/q_proj/Linear/post_convert", "/layers.10/self_attn/k_proj/Linear/pre_reshape", "/layers.10/self_attn/k_proj/Linear/pre_convert", "/layers.10/self_attn/k_proj/Linear", "/layers.10/self_attn/k_proj/Linear/post_convert", "/layers.10/self_attn/v_proj/Linear/pre_reshape", "/layers.10/self_attn/v_proj/Linear/pre_convert", "/layers.10/self_attn/v_proj/Linear", "/layers.10/self_attn/v_proj/Linear/post_convert", "/layers.10/self_attn/o_proj/Linear/pre_reshape", "/layers.10/self_attn/o_proj/Linear/pre_convert", "/layers.10/self_attn/o_proj/Linear", "/layers.10/self_attn/o_proj/Linear/post_convert", "/layers.10/mlp/gate_proj/Linear/pre_reshape", "/layers.10/mlp/gate_proj/Linear/pre_convert", "/layers.10/mlp/gate_proj/Linear", "/layers.10/mlp/gate_proj/Linear/post_convert", "/layers.10/mlp/up_proj/Linear/pre_reshape", "/layers.10/mlp/up_proj/Linear/pre_convert", "/layers.10/mlp/up_proj/Linear", "/layers.10/mlp/up_proj/Linear/post_convert", "/layers.10/mlp/down_proj/Linear/pre_reshape", "/layers.10/mlp/down_proj/Linear/pre_convert", "/layers.10/mlp/down_proj/Linear", "/layers.10/mlp/down_proj/Linear/post_convert", "/layers.11/self_attn/q_proj/Linear/pre_reshape", "/layers.11/self_attn/q_proj/Linear/pre_convert", "/layers.11/self_attn/q_proj/Linear", "/layers.11/self_attn/q_proj/Linear/post_convert", "/layers.11/self_attn/k_proj/Linear/pre_reshape", "/layers.11/self_attn/k_proj/Linear/pre_convert", "/layers.11/self_attn/k_proj/Linear", "/layers.11/self_attn/k_proj/Linear/post_convert", "/layers.11/self_attn/v_proj/Linear/pre_reshape", "/layers.11/self_attn/v_proj/Linear/pre_convert", "/layers.11/self_attn/v_proj/Linear", "/layers.11/self_attn/v_proj/Linear/post_convert", "/layers.11/self_attn/o_proj/Linear/pre_reshape", "/layers.11/self_attn/o_proj/Linear/pre_convert", "/layers.11/self_attn/o_proj/Linear", "/layers.11/self_attn/o_proj/Linear/post_convert", "/layers.11/mlp/gate_proj/Linear/pre_reshape", "/layers.11/mlp/gate_proj/Linear/pre_convert", "/layers.11/mlp/gate_proj/Linear", "/layers.11/mlp/gate_proj/Linear/post_convert", "/layers.11/mlp/up_proj/Linear/pre_reshape", "/layers.11/mlp/up_proj/Linear/pre_convert", "/layers.11/mlp/up_proj/Linear", "/layers.11/mlp/up_proj/Linear/post_convert", "/layers.11/mlp/down_proj/Linear/pre_reshape", "/layers.11/mlp/down_proj/Linear/pre_convert", "/layers.11/mlp/down_proj/Linear", "/layers.11/mlp/down_proj/Linear/post_convert", "/layers.12/self_attn/q_proj/Linear/pre_reshape", "/layers.12/self_attn/q_proj/Linear/pre_convert", "/layers.12/self_attn/q_proj/Linear", "/layers.12/self_attn/q_proj/Linear/post_convert", "/layers.12/self_attn/k_proj/Linear/pre_reshape", "/layers.12/self_attn/k_proj/Linear/pre_convert", "/layers.12/self_attn/k_proj/Linear", "/layers.12/self_attn/k_proj/Linear/post_convert", "/layers.12/self_attn/v_proj/Linear/pre_reshape", "/layers.12/self_attn/v_proj/Linear/pre_convert", "/layers.12/self_attn/v_proj/Linear", "/layers.12/self_attn/v_proj/Linear/post_convert", "/layers.12/self_attn/o_proj/Linear/pre_reshape", "/layers.12/self_attn/o_proj/Linear/pre_convert", "/layers.12/self_attn/o_proj/Linear", "/layers.12/self_attn/o_proj/Linear/post_convert", "/layers.12/mlp/gate_proj/Linear/pre_reshape", "/layers.12/mlp/gate_proj/Linear/pre_convert", "/layers.12/mlp/gate_proj/Linear", "/layers.12/mlp/gate_proj/Linear/post_convert", "/layers.12/mlp/up_proj/Linear/pre_reshape", "/layers.12/mlp/up_proj/Linear/pre_convert", "/layers.12/mlp/up_proj/Linear", "/layers.12/mlp/up_proj/Linear/post_convert", "/layers.12/mlp/down_proj/Linear/pre_reshape", "/layers.12/mlp/down_proj/Linear/pre_convert", "/layers.12/mlp/down_proj/Linear", "/layers.12/mlp/down_proj/Linear/post_convert", "/layers.13/self_attn/q_proj/Linear/pre_reshape", "/layers.13/self_attn/q_proj/Linear/pre_convert", "/layers.13/self_attn/q_proj/Linear", "/layers.13/self_attn/q_proj/Linear/post_convert", "/layers.13/self_attn/k_proj/Linear/pre_reshape", "/layers.13/self_attn/k_proj/Linear/pre_convert", "/layers.13/self_attn/k_proj/Linear", "/layers.13/self_attn/k_proj/Linear/post_convert", "/layers.13/self_attn/v_proj/Linear/pre_reshape", "/layers.13/self_attn/v_proj/Linear/pre_convert", "/layers.13/self_attn/v_proj/Linear", "/layers.13/self_attn/v_proj/Linear/post_convert", "/layers.13/self_attn/o_proj/Linear/pre_reshape", "/layers.13/self_attn/o_proj/Linear/pre_convert", "/layers.13/self_attn/o_proj/Linear", "/layers.13/self_attn/o_proj/Linear/post_convert", "/layers.13/mlp/gate_proj/Linear/pre_reshape", "/layers.13/mlp/gate_proj/Linear/pre_convert", "/layers.13/mlp/gate_proj/Linear", "/layers.13/mlp/gate_proj/Linear/post_convert", "/layers.13/mlp/up_proj/Linear/pre_reshape", "/layers.13/mlp/up_proj/Linear/pre_convert", "/layers.13/mlp/up_proj/Linear", "/layers.13/mlp/up_proj/Linear/post_convert", "/layers.13/mlp/down_proj/Linear/pre_reshape", "/layers.13/mlp/down_proj/Linear/pre_convert", "/layers.13/mlp/down_proj/Linear", "/layers.13/mlp/down_proj/Linear/post_convert", "/layers.14/self_attn/q_proj/Linear/pre_reshape", "/layers.14/self_attn/q_proj/Linear/pre_convert", "/layers.14/self_attn/q_proj/Linear", "/layers.14/self_attn/q_proj/Linear/post_convert", "/layers.14/self_attn/k_proj/Linear/pre_reshape", "/layers.14/self_attn/k_proj/Linear/pre_convert", "/layers.14/self_attn/k_proj/Linear", "/layers.14/self_attn/k_proj/Linear/post_convert", "/layers.14/self_attn/v_proj/Linear/pre_reshape", "/layers.14/self_attn/v_proj/Linear/pre_convert", "/layers.14/self_attn/v_proj/Linear", "/layers.14/self_attn/v_proj/Linear/post_convert", "/layers.14/self_attn/o_proj/Linear/pre_reshape", "/layers.14/self_attn/o_proj/Linear/pre_convert", "/layers.14/self_attn/o_proj/Linear", "/layers.14/self_attn/o_proj/Linear/post_convert", "/layers.14/mlp/gate_proj/Linear/pre_reshape", "/layers.14/mlp/gate_proj/Linear/pre_convert", "/layers.14/mlp/gate_proj/Linear", "/layers.14/mlp/gate_proj/Linear/post_convert", "/layers.14/mlp/up_proj/Linear/pre_reshape", "/layers.14/mlp/up_proj/Linear/pre_convert", "/layers.14/mlp/up_proj/Linear", "/layers.14/mlp/up_proj/Linear/post_convert", "/layers.14/mlp/down_proj/Linear/pre_reshape", "/layers.14/mlp/down_proj/Linear/pre_convert", "/layers.14/mlp/down_proj/Linear", "/layers.14/mlp/down_proj/Linear/post_convert", "/layers.15/self_attn/q_proj/Linear/pre_reshape", "/layers.15/self_attn/q_proj/Linear/pre_convert", "/layers.15/self_attn/q_proj/Linear", "/layers.15/self_attn/q_proj/Linear/post_convert", "/layers.15/self_attn/k_proj/Linear/pre_reshape", "/layers.15/self_attn/k_proj/Linear/pre_convert", "/layers.15/self_attn/k_proj/Linear", "/layers.15/self_attn/k_proj/Linear/post_convert", "/layers.15/self_attn/v_proj/Linear/pre_reshape", "/layers.15/self_attn/v_proj/Linear/pre_convert", "/layers.15/self_attn/v_proj/Linear", "/layers.15/self_attn/v_proj/Linear/post_convert", "/layers.15/self_attn/o_proj/Linear/pre_reshape", "/layers.15/self_attn/o_proj/Linear/pre_convert", "/layers.15/self_attn/o_proj/Linear", "/layers.15/self_attn/o_proj/Linear/post_convert", "/layers.15/mlp/gate_proj/Linear/pre_reshape", "/layers.15/mlp/gate_proj/Linear/pre_convert", "/layers.15/mlp/gate_proj/Linear", "/layers.15/mlp/gate_proj/Linear/post_convert", "/layers.15/mlp/up_proj/Linear/pre_reshape", "/layers.15/mlp/up_proj/Linear/pre_convert", "/layers.15/mlp/up_proj/Linear", "/layers.15/mlp/up_proj/Linear/post_convert", "/layers.15/mlp/down_proj/Linear/pre_reshape", "/layers.15/mlp/down_proj/Linear/pre_convert", "/layers.15/mlp/down_proj/Linear", "/layers.15/mlp/down_proj/Linear/post_convert", "/layers.16/self_attn/q_proj/Linear/pre_reshape", "/layers.16/self_attn/q_proj/Linear/pre_convert", "/layers.16/self_attn/q_proj/Linear", "/layers.16/self_attn/q_proj/Linear/post_convert", "/layers.16/self_attn/k_proj/Linear/pre_reshape", "/layers.16/self_attn/k_proj/Linear/pre_convert", "/layers.16/self_attn/k_proj/Linear", "/layers.16/self_attn/k_proj/Linear/post_convert", "/layers.16/self_attn/v_proj/Linear/pre_reshape", "/layers.16/self_attn/v_proj/Linear/pre_convert", "/layers.16/self_attn/v_proj/Linear", "/layers.16/self_attn/v_proj/Linear/post_convert", "/layers.16/self_attn/o_proj/Linear/pre_reshape", "/layers.16/self_attn/o_proj/Linear/pre_convert", "/layers.16/self_attn/o_proj/Linear", "/layers.16/self_attn/o_proj/Linear/post_convert", "/layers.16/mlp/gate_proj/Linear/pre_reshape", "/layers.16/mlp/gate_proj/Linear/pre_convert", "/layers.16/mlp/gate_proj/Linear", "/layers.16/mlp/gate_proj/Linear/post_convert", "/layers.16/mlp/up_proj/Linear/pre_reshape", "/layers.16/mlp/up_proj/Linear/pre_convert", "/layers.16/mlp/up_proj/Linear", "/layers.16/mlp/up_proj/Linear/post_convert", "/layers.16/mlp/down_proj/Linear/pre_reshape", "/layers.16/mlp/down_proj/Linear/pre_convert", "/layers.16/mlp/down_proj/Linear", "/layers.16/mlp/down_proj/Linear/post_convert", "/layers.17/self_attn/q_proj/Linear/pre_reshape", "/layers.17/self_attn/q_proj/Linear/pre_convert", "/layers.17/self_attn/q_proj/Linear", "/layers.17/self_attn/q_proj/Linear/post_convert", "/layers.17/self_attn/k_proj/Linear/pre_reshape", "/layers.17/self_attn/k_proj/Linear/pre_convert", "/layers.17/self_attn/k_proj/Linear", "/layers.17/self_attn/k_proj/Linear/post_convert", "/layers.17/self_attn/v_proj/Linear/pre_reshape", "/layers.17/self_attn/v_proj/Linear/pre_convert", "/layers.17/self_attn/v_proj/Linear", "/layers.17/self_attn/v_proj/Linear/post_convert", "/layers.17/self_attn/o_proj/Linear/pre_reshape", "/layers.17/self_attn/o_proj/Linear/pre_convert", "/layers.17/self_attn/o_proj/Linear", "/layers.17/self_attn/o_proj/Linear/post_convert", "/layers.17/mlp/gate_proj/Linear/pre_reshape", "/layers.17/mlp/gate_proj/Linear/pre_convert", "/layers.17/mlp/gate_proj/Linear", "/layers.17/mlp/gate_proj/Linear/post_convert", "/layers.17/mlp/up_proj/Linear/pre_reshape", "/layers.17/mlp/up_proj/Linear/pre_convert", "/layers.17/mlp/up_proj/Linear", "/layers.17/mlp/up_proj/Linear/post_convert", "/layers.17/mlp/down_proj/Linear/pre_reshape", "/layers.17/mlp/down_proj/Linear/pre_convert", "/layers.17/mlp/down_proj/Linear", "/layers.17/mlp/down_proj/Linear/post_convert", "/layers.18/self_attn/q_proj/Linear/pre_reshape", "/layers.18/self_attn/q_proj/Linear/pre_convert", "/layers.18/self_attn/q_proj/Linear", "/layers.18/self_attn/q_proj/Linear/post_convert", "/layers.18/self_attn/k_proj/Linear/pre_reshape", "/layers.18/self_attn/k_proj/Linear/pre_convert", "/layers.18/self_attn/k_proj/Linear", "/layers.18/self_attn/k_proj/Linear/post_convert", "/layers.18/self_attn/v_proj/Linear/pre_reshape", "/layers.18/self_attn/v_proj/Linear/pre_convert", "/layers.18/self_attn/v_proj/Linear", "/layers.18/self_attn/v_proj/Linear/post_convert", "/layers.18/self_attn/o_proj/Linear/pre_reshape", "/layers.18/self_attn/o_proj/Linear/pre_convert", "/layers.18/self_attn/o_proj/Linear", "/layers.18/self_attn/o_proj/Linear/post_convert", "/layers.18/mlp/gate_proj/Linear/pre_reshape", "/layers.18/mlp/gate_proj/Linear/pre_convert", "/layers.18/mlp/gate_proj/Linear", "/layers.18/mlp/gate_proj/Linear/post_convert", "/layers.18/mlp/up_proj/Linear/pre_reshape", "/layers.18/mlp/up_proj/Linear/pre_convert", "/layers.18/mlp/up_proj/Linear", "/layers.18/mlp/up_proj/Linear/post_convert", "/layers.18/mlp/down_proj/Linear/pre_reshape", "/layers.18/mlp/down_proj/Linear/pre_convert", "/layers.18/mlp/down_proj/Linear", "/layers.18/mlp/down_proj/Linear/post_convert", "/layers.19/self_attn/q_proj/Linear/pre_reshape", "/layers.19/self_attn/q_proj/Linear/pre_convert", "/layers.19/self_attn/q_proj/Linear", "/layers.19/self_attn/q_proj/Linear/post_convert", "/layers.19/self_attn/k_proj/Linear/pre_reshape", "/layers.19/self_attn/k_proj/Linear/pre_convert", "/layers.19/self_attn/k_proj/Linear", "/layers.19/self_attn/k_proj/Linear/post_convert", "/layers.19/self_attn/v_proj/Linear/pre_reshape", "/layers.19/self_attn/v_proj/Linear/pre_convert", "/layers.19/self_attn/v_proj/Linear", "/layers.19/self_attn/v_proj/Linear/post_convert", "/layers.19/self_attn/o_proj/Linear/pre_reshape", "/layers.19/self_attn/o_proj/Linear/pre_convert", "/layers.19/self_attn/o_proj/Linear", "/layers.19/self_attn/o_proj/Linear/post_convert", "/layers.19/mlp/gate_proj/Linear/pre_reshape", "/layers.19/mlp/gate_proj/Linear/pre_convert", "/layers.19/mlp/gate_proj/Linear", "/layers.19/mlp/gate_proj/Linear/post_convert", "/layers.19/mlp/up_proj/Linear/pre_reshape", "/layers.19/mlp/up_proj/Linear/pre_convert", "/layers.19/mlp/up_proj/Linear", "/layers.19/mlp/up_proj/Linear/post_convert", "/layers.19/mlp/down_proj/Linear/pre_reshape", "/layers.19/mlp/down_proj/Linear/pre_convert", "/layers.19/mlp/down_proj/Linear", "/layers.19/mlp/down_proj/Linear/post_convert", "/layers.20/self_attn/q_proj/Linear/pre_reshape", "/layers.20/self_attn/q_proj/Linear/pre_convert", "/layers.20/self_attn/q_proj/Linear", "/layers.20/self_attn/q_proj/Linear/post_convert", "/layers.20/self_attn/k_proj/Linear/pre_reshape", "/layers.20/self_attn/k_proj/Linear/pre_convert", "/layers.20/self_attn/k_proj/Linear", "/layers.20/self_attn/k_proj/Linear/post_convert", "/layers.20/self_attn/v_proj/Linear/pre_reshape", "/layers.20/self_attn/v_proj/Linear/pre_convert", "/layers.20/self_attn/v_proj/Linear", "/layers.20/self_attn/v_proj/Linear/post_convert", "/layers.20/self_attn/o_proj/Linear/pre_reshape", "/layers.20/self_attn/o_proj/Linear/pre_convert", "/layers.20/self_attn/o_proj/Linear", "/layers.20/self_attn/o_proj/Linear/post_convert", "/layers.20/mlp/gate_proj/Linear/pre_reshape", "/layers.20/mlp/gate_proj/Linear/pre_convert", "/layers.20/mlp/gate_proj/Linear", "/layers.20/mlp/gate_proj/Linear/post_convert", "/layers.20/mlp/up_proj/Linear/pre_reshape", "/layers.20/mlp/up_proj/Linear/pre_convert", "/layers.20/mlp/up_proj/Linear", "/layers.20/mlp/up_proj/Linear/post_convert", "/layers.20/mlp/down_proj/Linear/pre_reshape", "/layers.20/mlp/down_proj/Linear/pre_convert", "/layers.20/mlp/down_proj/Linear", "/layers.20/mlp/down_proj/Linear/post_convert", "/layers.21/self_attn/q_proj/Linear/pre_reshape", "/layers.21/self_attn/q_proj/Linear/pre_convert", "/layers.21/self_attn/q_proj/Linear", "/layers.21/self_attn/q_proj/Linear/post_convert", "/layers.21/self_attn/k_proj/Linear/pre_reshape", "/layers.21/self_attn/k_proj/Linear/pre_convert", "/layers.21/self_attn/k_proj/Linear", "/layers.21/self_attn/k_proj/Linear/post_convert", "/layers.21/self_attn/v_proj/Linear/pre_reshape", "/layers.21/self_attn/v_proj/Linear/pre_convert", "/layers.21/self_attn/v_proj/Linear", "/layers.21/self_attn/v_proj/Linear/post_convert", "/layers.21/self_attn/o_proj/Linear/pre_reshape", "/layers.21/self_attn/o_proj/Linear/pre_convert", "/layers.21/self_attn/o_proj/Linear", "/layers.21/self_attn/o_proj/Linear/post_convert", "/layers.21/mlp/gate_proj/Linear/pre_reshape", "/layers.21/mlp/gate_proj/Linear/pre_convert", "/layers.21/mlp/gate_proj/Linear", "/layers.21/mlp/gate_proj/Linear/post_convert", "/layers.21/mlp/up_proj/Linear/pre_reshape", "/layers.21/mlp/up_proj/Linear/pre_convert", "/layers.21/mlp/up_proj/Linear", "/layers.21/mlp/up_proj/Linear/post_convert", "/layers.21/mlp/down_proj/Linear/pre_reshape", "/layers.21/mlp/down_proj/Linear/pre_convert", "/layers.21/mlp/down_proj/Linear", "/layers.21/mlp/down_proj/Linear/post_convert", "/layers.22/self_attn/q_proj/Linear/pre_reshape", "/layers.22/self_attn/q_proj/Linear/pre_convert", "/layers.22/self_attn/q_proj/Linear", "/layers.22/self_attn/q_proj/Linear/post_convert", "/layers.22/self_attn/k_proj/Linear/pre_reshape", "/layers.22/self_attn/k_proj/Linear/pre_convert", "/layers.22/self_attn/k_proj/Linear", "/layers.22/self_attn/k_proj/Linear/post_convert", "/layers.22/self_attn/v_proj/Linear/pre_reshape", "/layers.22/self_attn/v_proj/Linear/pre_convert", "/layers.22/self_attn/v_proj/Linear", "/layers.22/self_attn/v_proj/Linear/post_convert", "/layers.22/self_attn/o_proj/Linear/pre_reshape", "/layers.22/self_attn/o_proj/Linear/pre_convert", "/layers.22/self_attn/o_proj/Linear", "/layers.22/self_attn/o_proj/Linear/post_convert", "/layers.22/mlp/gate_proj/Linear/pre_reshape", "/layers.22/mlp/gate_proj/Linear/pre_convert", "/layers.22/mlp/gate_proj/Linear", "/layers.22/mlp/gate_proj/Linear/post_convert", "/layers.22/mlp/up_proj/Linear/pre_reshape", "/layers.22/mlp/up_proj/Linear/pre_convert", "/layers.22/mlp/up_proj/Linear", "/layers.22/mlp/up_proj/Linear/post_convert", "/layers.22/mlp/down_proj/Linear/pre_reshape", "/layers.22/mlp/down_proj/Linear/pre_convert", "/layers.22/mlp/down_proj/Linear", "/layers.22/mlp/down_proj/Linear/post_convert", "/layers.23/self_attn/q_proj/Linear/pre_reshape", "/layers.23/self_attn/q_proj/Linear/pre_convert", "/layers.23/self_attn/q_proj/Linear", "/layers.23/self_attn/q_proj/Linear/post_convert", "/layers.23/self_attn/k_proj/Linear/pre_reshape", "/layers.23/self_attn/k_proj/Linear/pre_convert", "/layers.23/self_attn/k_proj/Linear", "/layers.23/self_attn/k_proj/Linear/post_convert", "/layers.23/self_attn/v_proj/Linear/pre_reshape", "/layers.23/self_attn/v_proj/Linear/pre_convert", "/layers.23/self_attn/v_proj/Linear", "/layers.23/self_attn/v_proj/Linear/post_convert", "/layers.23/self_attn/o_proj/Linear/pre_reshape", "/layers.23/self_attn/o_proj/Linear/pre_convert", "/layers.23/self_attn/o_proj/Linear", "/layers.23/self_attn/o_proj/Linear/post_convert", "/layers.23/mlp/gate_proj/Linear/pre_reshape", "/layers.23/mlp/gate_proj/Linear/pre_convert", "/layers.23/mlp/gate_proj/Linear", "/layers.23/mlp/gate_proj/Linear/post_convert", "/layers.23/mlp/up_proj/Linear/pre_reshape", "/layers.23/mlp/up_proj/Linear/pre_convert", "/layers.23/mlp/up_proj/Linear", "/layers.23/mlp/up_proj/Linear/post_convert", "/layers.23/mlp/down_proj/Linear/pre_reshape", "/layers.23/mlp/down_proj/Linear/pre_convert", "/layers.23/mlp/down_proj/Linear", "/layers.23/mlp/down_proj/Linear/post_convert", "/layers.24/self_attn/q_proj/Linear/pre_reshape", "/layers.24/self_attn/q_proj/Linear/pre_convert", "/layers.24/self_attn/q_proj/Linear", "/layers.24/self_attn/q_proj/Linear/post_convert", "/layers.24/self_attn/k_proj/Linear/pre_reshape", "/layers.24/self_attn/k_proj/Linear/pre_convert", "/layers.24/self_attn/k_proj/Linear", "/layers.24/self_attn/k_proj/Linear/post_convert", "/layers.24/self_attn/v_proj/Linear/pre_reshape", "/layers.24/self_attn/v_proj/Linear/pre_convert", "/layers.24/self_attn/v_proj/Linear", "/layers.24/self_attn/v_proj/Linear/post_convert", "/layers.24/self_attn/o_proj/Linear/pre_reshape", "/layers.24/self_attn/o_proj/Linear/pre_convert", "/layers.24/self_attn/o_proj/Linear", "/layers.24/self_attn/o_proj/Linear/post_convert", "/layers.24/mlp/gate_proj/Linear/pre_reshape", "/layers.24/mlp/gate_proj/Linear/pre_convert", "/layers.24/mlp/gate_proj/Linear", "/layers.24/mlp/gate_proj/Linear/post_convert", "/layers.24/mlp/up_proj/Linear/pre_reshape", "/layers.24/mlp/up_proj/Linear/pre_convert", "/layers.24/mlp/up_proj/Linear", "/layers.24/mlp/up_proj/Linear/post_convert", "/layers.24/mlp/down_proj/Linear/pre_reshape", "/layers.24/mlp/down_proj/Linear/pre_convert", "/layers.24/mlp/down_proj/Linear", "/layers.24/mlp/down_proj/Linear/post_convert", "/layers.25/self_attn/q_proj/Linear/pre_reshape", "/layers.25/self_attn/q_proj/Linear/pre_convert", "/layers.25/self_attn/q_proj/Linear", "/layers.25/self_attn/q_proj/Linear/post_convert", "/layers.25/self_attn/k_proj/Linear/pre_reshape", "/layers.25/self_attn/k_proj/Linear/pre_convert", "/layers.25/self_attn/k_proj/Linear", "/layers.25/self_attn/k_proj/Linear/post_convert", "/layers.25/self_attn/v_proj/Linear/pre_reshape", "/layers.25/self_attn/v_proj/Linear/pre_convert", "/layers.25/self_attn/v_proj/Linear", "/layers.25/self_attn/v_proj/Linear/post_convert", "/layers.25/self_attn/o_proj/Linear/pre_reshape", "/layers.25/self_attn/o_proj/Linear/pre_convert", "/layers.25/self_attn/o_proj/Linear", "/layers.25/self_attn/o_proj/Linear/post_convert", "/layers.25/mlp/gate_proj/Linear/pre_reshape", "/layers.25/mlp/gate_proj/Linear/pre_convert", "/layers.25/mlp/gate_proj/Linear", "/layers.25/mlp/gate_proj/Linear/post_convert", "/layers.25/mlp/up_proj/Linear/pre_reshape", "/layers.25/mlp/up_proj/Linear/pre_convert", "/layers.25/mlp/up_proj/Linear", "/layers.25/mlp/up_proj/Linear/post_convert", "/layers.25/mlp/down_proj/Linear/pre_reshape", "/layers.25/mlp/down_proj/Linear/pre_convert", "/layers.25/mlp/down_proj/Linear", "/layers.25/mlp/down_proj/Linear/post_convert", "/layers.26/self_attn/q_proj/Linear/pre_reshape", "/layers.26/self_attn/q_proj/Linear/pre_convert", "/layers.26/self_attn/q_proj/Linear", "/layers.26/self_attn/q_proj/Linear/post_convert", "/layers.26/self_attn/k_proj/Linear/pre_reshape", "/layers.26/self_attn/k_proj/Linear/pre_convert", "/layers.26/self_attn/k_proj/Linear", "/layers.26/self_attn/k_proj/Linear/post_convert", "/layers.26/self_attn/v_proj/Linear/pre_reshape", "/layers.26/self_attn/v_proj/Linear/pre_convert", "/layers.26/self_attn/v_proj/Linear", "/layers.26/self_attn/v_proj/Linear/post_convert", "/layers.26/self_attn/o_proj/Linear/pre_reshape", "/layers.26/self_attn/o_proj/Linear/pre_convert", "/layers.26/self_attn/o_proj/Linear", "/layers.26/self_attn/o_proj/Linear/post_convert", "/layers.26/mlp/gate_proj/Linear/pre_reshape", "/layers.26/mlp/gate_proj/Linear/pre_convert", "/layers.26/mlp/gate_proj/Linear", "/layers.26/mlp/gate_proj/Linear/post_convert", "/layers.26/mlp/up_proj/Linear/pre_reshape", "/layers.26/mlp/up_proj/Linear/pre_convert", "/layers.26/mlp/up_proj/Linear", "/layers.26/mlp/up_proj/Linear/post_convert", "/layers.26/mlp/down_proj/Linear/pre_reshape", "/layers.26/mlp/down_proj/Linear/pre_convert", "/layers.26/mlp/down_proj/Linear", "/layers.26/mlp/down_proj/Linear/post_convert", "/layers.27/self_attn/q_proj/Linear/pre_reshape", "/layers.27/self_attn/q_proj/Linear/pre_convert", "/layers.27/self_attn/q_proj/Linear", "/layers.27/self_attn/q_proj/Linear/post_convert", "/layers.27/self_attn/k_proj/Linear/pre_reshape", "/layers.27/self_attn/k_proj/Linear/pre_convert", "/layers.27/self_attn/k_proj/Linear", "/layers.27/self_attn/k_proj/Linear/post_convert", "/layers.27/self_attn/v_proj/Linear/pre_reshape", "/layers.27/self_attn/v_proj/Linear/pre_convert", "/layers.27/self_attn/v_proj/Linear", "/layers.27/self_attn/v_proj/Linear/post_convert", "/layers.27/self_attn/o_proj/Linear/pre_reshape", "/layers.27/self_attn/o_proj/Linear/pre_convert", "/layers.27/self_attn/o_proj/Linear", "/layers.27/self_attn/o_proj/Linear/post_convert", "/layers.27/mlp/gate_proj/Linear/pre_reshape", "/layers.27/mlp/gate_proj/Linear/pre_convert", "/layers.27/mlp/gate_proj/Linear", "/layers.27/mlp/gate_proj/Linear/post_convert", "/layers.27/mlp/up_proj/Linear/pre_reshape", "/layers.27/mlp/up_proj/Linear/pre_convert", "/layers.27/mlp/up_proj/Linear", "/layers.27/mlp/up_proj/Linear/post_convert", "/layers.27/mlp/down_proj/Linear/pre_reshape", "/layers.27/mlp/down_proj/Linear/pre_convert", "/layers.27/mlp/down_proj/Linear", "/layers.27/mlp/down_proj/Linear/post_convert", "/layers.28/self_attn/q_proj/Linear/pre_reshape", "/layers.28/self_attn/q_proj/Linear/pre_convert", "/layers.28/self_attn/q_proj/Linear", "/layers.28/self_attn/q_proj/Linear/post_convert", "/layers.28/self_attn/k_proj/Linear/pre_reshape", "/layers.28/self_attn/k_proj/Linear/pre_convert", "/layers.28/self_attn/k_proj/Linear", "/layers.28/self_attn/k_proj/Linear/post_convert", "/layers.28/self_attn/v_proj/Linear/pre_reshape", "/layers.28/self_attn/v_proj/Linear/pre_convert", "/layers.28/self_attn/v_proj/Linear", "/layers.28/self_attn/v_proj/Linear/post_convert", "/layers.28/self_attn/o_proj/Linear/pre_reshape", "/layers.28/self_attn/o_proj/Linear/pre_convert", "/layers.28/self_attn/o_proj/Linear", "/layers.28/self_attn/o_proj/Linear/post_convert", "/layers.28/mlp/gate_proj/Linear/pre_reshape", "/layers.28/mlp/gate_proj/Linear/pre_convert", "/layers.28/mlp/gate_proj/Linear", "/layers.28/mlp/gate_proj/Linear/post_convert", "/layers.28/mlp/up_proj/Linear/pre_reshape", "/layers.28/mlp/up_proj/Linear/pre_convert", "/layers.28/mlp/up_proj/Linear", "/layers.28/mlp/up_proj/Linear/post_convert", "/layers.28/mlp/down_proj/Linear/pre_reshape", "/layers.28/mlp/down_proj/Linear/pre_convert", "/layers.28/mlp/down_proj/Linear", "/layers.28/mlp/down_proj/Linear/post_convert", "/layers.29/self_attn/q_proj/Linear/pre_reshape", "/layers.29/self_attn/q_proj/Linear/pre_convert", "/layers.29/self_attn/q_proj/Linear", "/layers.29/self_attn/q_proj/Linear/post_convert", "/layers.29/self_attn/k_proj/Linear/pre_reshape", "/layers.29/self_attn/k_proj/Linear/pre_convert", "/layers.29/self_attn/k_proj/Linear", "/layers.29/self_attn/k_proj/Linear/post_convert", "/layers.29/self_attn/v_proj/Linear/pre_reshape", "/layers.29/self_attn/v_proj/Linear/pre_convert", "/layers.29/self_attn/v_proj/Linear", "/layers.29/self_attn/v_proj/Linear/post_convert", "/layers.29/self_attn/o_proj/Linear/pre_reshape", "/layers.29/self_attn/o_proj/Linear/pre_convert", "/layers.29/self_attn/o_proj/Linear", "/layers.29/self_attn/o_proj/Linear/post_convert", "/layers.29/mlp/gate_proj/Linear/pre_reshape", "/layers.29/mlp/gate_proj/Linear/pre_convert", "/layers.29/mlp/gate_proj/Linear", "/layers.29/mlp/gate_proj/Linear/post_convert", "/layers.29/mlp/up_proj/Linear/pre_reshape", "/layers.29/mlp/up_proj/Linear/pre_convert", "/layers.29/mlp/up_proj/Linear", "/layers.29/mlp/up_proj/Linear/post_convert", "/layers.29/mlp/down_proj/Linear/pre_reshape", "/layers.29/mlp/down_proj/Linear/pre_convert", "/layers.29/mlp/down_proj/Linear", "/layers.29/mlp/down_proj/Linear/post_convert", "/layers.30/self_attn/q_proj/Linear/pre_reshape", "/layers.30/self_attn/q_proj/Linear/pre_convert", "/layers.30/self_attn/q_proj/Linear", "/layers.30/self_attn/q_proj/Linear/post_convert", "/layers.30/self_attn/k_proj/Linear/pre_reshape", "/layers.30/self_attn/k_proj/Linear/pre_convert", "/layers.30/self_attn/k_proj/Linear", "/layers.30/self_attn/k_proj/Linear/post_convert", "/layers.30/self_attn/v_proj/Linear/pre_reshape", "/layers.30/self_attn/v_proj/Linear/pre_convert", "/layers.30/self_attn/v_proj/Linear", "/layers.30/self_attn/v_proj/Linear/post_convert", "/layers.30/self_attn/o_proj/Linear/pre_reshape", "/layers.30/self_attn/o_proj/Linear/pre_convert", "/layers.30/self_attn/o_proj/Linear", "/layers.30/self_attn/o_proj/Linear/post_convert", "/layers.30/mlp/gate_proj/Linear/pre_reshape", "/layers.30/mlp/gate_proj/Linear/pre_convert", "/layers.30/mlp/gate_proj/Linear", "/layers.30/mlp/gate_proj/Linear/post_convert", "/layers.30/mlp/up_proj/Linear/pre_reshape", "/layers.30/mlp/up_proj/Linear/pre_convert", "/layers.30/mlp/up_proj/Linear", "/layers.30/mlp/up_proj/Linear/post_convert", "/layers.30/mlp/down_proj/Linear/pre_reshape", "/layers.30/mlp/down_proj/Linear/pre_convert", "/layers.30/mlp/down_proj/Linear", "/layers.30/mlp/down_proj/Linear/post_convert", "/layers.31/self_attn/q_proj/Linear/pre_reshape", "/layers.31/self_attn/q_proj/Linear/pre_convert", "/layers.31/self_attn/q_proj/Linear", "/layers.31/self_attn/q_proj/Linear/post_convert", "/layers.31/self_attn/k_proj/Linear/pre_reshape", "/layers.31/self_attn/k_proj/Linear/pre_convert", "/layers.31/self_attn/k_proj/Linear", "/layers.31/self_attn/k_proj/Linear/post_convert", "/layers.31/self_attn/v_proj/Linear/pre_reshape", "/layers.31/self_attn/v_proj/Linear/pre_convert", "/layers.31/self_attn/v_proj/Linear", "/layers.31/self_attn/v_proj/Linear/post_convert", "/layers.31/self_attn/o_proj/Linear/pre_reshape", "/layers.31/self_attn/o_proj/Linear/pre_convert", "/layers.31/self_attn/o_proj/Linear", "/layers.31/self_attn/o_proj/Linear/post_convert", "/layers.31/mlp/gate_proj/Linear/pre_reshape", "/layers.31/mlp/gate_proj/Linear/pre_convert", "/layers.31/mlp/gate_proj/Linear", "/layers.31/mlp/gate_proj/Linear/post_convert", "/layers.31/mlp/up_proj/Linear/pre_reshape", "/layers.31/mlp/up_proj/Linear/pre_convert", "/layers.31/mlp/up_proj/Linear", "/layers.31/mlp/up_proj/Linear/post_convert", "/layers.31/mlp/down_proj/Linear/pre_reshape", "/layers.31/mlp/down_proj/Linear/pre_convert", "/layers.31/mlp/down_proj/Linear", "/layers.31/mlp/down_proj/Linear/post_convert", "/layers.32/self_attn/q_proj/Linear/pre_reshape", "/layers.32/self_attn/q_proj/Linear/pre_convert", "/layers.32/self_attn/q_proj/Linear", "/layers.32/self_attn/q_proj/Linear/post_convert", "/layers.32/self_attn/k_proj/Linear/pre_reshape", "/layers.32/self_attn/k_proj/Linear/pre_convert", "/layers.32/self_attn/k_proj/Linear", "/layers.32/self_attn/k_proj/Linear/post_convert", "/layers.32/self_attn/v_proj/Linear/pre_reshape", "/layers.32/self_attn/v_proj/Linear/pre_convert", "/layers.32/self_attn/v_proj/Linear", "/layers.32/self_attn/v_proj/Linear/post_convert", "/layers.32/self_attn/o_proj/Linear/pre_reshape", "/layers.32/self_attn/o_proj/Linear/pre_convert", "/layers.32/self_attn/o_proj/Linear", "/layers.32/self_attn/o_proj/Linear/post_convert", "/layers.32/mlp/gate_proj/Linear/pre_reshape", "/layers.32/mlp/gate_proj/Linear/pre_convert", "/layers.32/mlp/gate_proj/Linear", "/layers.32/mlp/gate_proj/Linear/post_convert", "/layers.32/mlp/up_proj/Linear/pre_reshape", "/layers.32/mlp/up_proj/Linear/pre_convert", "/layers.32/mlp/up_proj/Linear", "/layers.32/mlp/up_proj/Linear/post_convert", "/layers.32/mlp/down_proj/Linear/pre_reshape", "/layers.32/mlp/down_proj/Linear/pre_convert", "/layers.32/mlp/down_proj/Linear", "/layers.32/mlp/down_proj/Linear/post_convert", "/layers.33/self_attn/q_proj/Linear/pre_reshape", "/layers.33/self_attn/q_proj/Linear/pre_convert", "/layers.33/self_attn/q_proj/Linear", "/layers.33/self_attn/q_proj/Linear/post_convert", "/layers.33/self_attn/k_proj/Linear/pre_reshape", "/layers.33/self_attn/k_proj/Linear/pre_convert", "/layers.33/self_attn/k_proj/Linear", "/layers.33/self_attn/k_proj/Linear/post_convert", "/layers.33/self_attn/v_proj/Linear/pre_reshape", "/layers.33/self_attn/v_proj/Linear/pre_convert", "/layers.33/self_attn/v_proj/Linear", "/layers.33/self_attn/v_proj/Linear/post_convert", "/layers.33/self_attn/o_proj/Linear/pre_reshape", "/layers.33/self_attn/o_proj/Linear/pre_convert", "/layers.33/self_attn/o_proj/Linear", "/layers.33/self_attn/o_proj/Linear/post_convert", "/layers.33/mlp/gate_proj/Linear/pre_reshape", "/layers.33/mlp/gate_proj/Linear/pre_convert", "/layers.33/mlp/gate_proj/Linear", "/layers.33/mlp/gate_proj/Linear/post_convert", "/layers.33/mlp/up_proj/Linear/pre_reshape", "/layers.33/mlp/up_proj/Linear/pre_convert", "/layers.33/mlp/up_proj/Linear", "/layers.33/mlp/up_proj/Linear/post_convert", "/layers.33/mlp/down_proj/Linear/pre_reshape", "/layers.33/mlp/down_proj/Linear/pre_convert", "/layers.33/mlp/down_proj/Linear", "/layers.33/mlp/down_proj/Linear/post_convert", "/layers.34/self_attn/q_proj/Linear/pre_reshape", "/layers.34/self_attn/q_proj/Linear/pre_convert", "/layers.34/self_attn/q_proj/Linear", "/layers.34/self_attn/q_proj/Linear/post_convert", "/layers.34/self_attn/k_proj/Linear/pre_reshape", "/layers.34/self_attn/k_proj/Linear/pre_convert", "/layers.34/self_attn/k_proj/Linear", "/layers.34/self_attn/k_proj/Linear/post_convert", "/layers.34/self_attn/v_proj/Linear/pre_reshape", "/layers.34/self_attn/v_proj/Linear/pre_convert", "/layers.34/self_attn/v_proj/Linear", "/layers.34/self_attn/v_proj/Linear/post_convert", "/layers.34/self_attn/o_proj/Linear/pre_reshape", "/layers.34/self_attn/o_proj/Linear/pre_convert", "/layers.34/self_attn/o_proj/Linear", "/layers.34/self_attn/o_proj/Linear/post_convert", "/layers.34/mlp/gate_proj/Linear/pre_reshape", "/layers.34/mlp/gate_proj/Linear/pre_convert", "/layers.34/mlp/gate_proj/Linear", "/layers.34/mlp/gate_proj/Linear/post_convert", "/layers.34/mlp/up_proj/Linear/pre_reshape", "/layers.34/mlp/up_proj/Linear/pre_convert", "/layers.34/mlp/up_proj/Linear", "/layers.34/mlp/up_proj/Linear/post_convert", "/layers.34/mlp/down_proj/Linear/pre_reshape", "/layers.34/mlp/down_proj/Linear/pre_convert", "/layers.34/mlp/down_proj/Linear", "/layers.34/mlp/down_proj/Linear/post_convert", "/layers.35/self_attn/q_proj/Linear/pre_reshape", "/layers.35/self_attn/q_proj/Linear/pre_convert", "/layers.35/self_attn/q_proj/Linear", "/layers.35/self_attn/q_proj/Linear/post_convert", "/layers.35/self_attn/k_proj/Linear/pre_reshape", "/layers.35/self_attn/k_proj/Linear/pre_convert", "/layers.35/self_attn/k_proj/Linear", "/layers.35/self_attn/k_proj/Linear/post_convert", "/layers.35/self_attn/v_proj/Linear/pre_reshape", "/layers.35/self_attn/v_proj/Linear/pre_convert", "/layers.35/self_attn/v_proj/Linear", "/layers.35/self_attn/v_proj/Linear/post_convert", "/layers.35/self_attn/o_proj/Linear/pre_reshape", "/layers.35/self_attn/o_proj/Linear/pre_convert", "/layers.35/self_attn/o_proj/Linear", "/layers.35/self_attn/o_proj/Linear/post_convert", "/layers.35/mlp/gate_proj/Linear/pre_reshape", "/layers.35/mlp/gate_proj/Linear/pre_convert", "/layers.35/mlp/gate_proj/Linear", "/layers.35/mlp/gate_proj/Linear/post_convert", "/layers.35/mlp/up_proj/Linear/pre_reshape", "/layers.35/mlp/up_proj/Linear/pre_convert", "/layers.35/mlp/up_proj/Linear", "/layers.35/mlp/up_proj/Linear/post_convert", "/layers.35/mlp/down_proj/Linear/pre_reshape", "/layers.35/mlp/down_proj/Linear/pre_convert", "/layers.35/mlp/down_proj/Linear", "/layers.35/mlp/down_proj/Linear/post_convert", "/lm/lm_head/Linear/pre_reshape", "/lm/lm_head/Linear/pre_convert", "/lm/lm_head/Linear", "/lm/lm_head/Linear/post_convert" ] , "tensorNumber": 0, "usage": "INFERENCE", "mnn_uuid": "7ac258de-4b9e-4046-8472-4bde442823c1" }