x86/broadwell/floating-point.json

b74d1315SAndi Kleen[
b74d1315SAndi Kleen    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational 128-bit packed double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 2 computation operations, one for each element.  Applies to SSE* and AVX* packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element.",
10e8d85fSIan Rogers        "EventCode": "0xc7",
b74d1315SAndi Kleen        "EventName": "FP_ARITH_INST_RETIRED.128B_PACKED_DOUBLE",
*78036545SIan Rogers        "PublicDescription": "Number of SSE/AVX computational 128-bit packed double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 2 computation operations, one for each element.  Applies to SSE* and AVX* packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
b74d1315SAndi Kleen        "SampleAfterValue": "2000003",
10e8d85fSIan Rogers        "UMask": "0x4"
b74d1315SAndi Kleen    },
b74d1315SAndi Kleen    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational 128-bit packed single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 4 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element.",
10e8d85fSIan Rogers        "EventCode": "0xc7",
b74d1315SAndi Kleen        "EventName": "FP_ARITH_INST_RETIRED.128B_PACKED_SINGLE",
*78036545SIan Rogers        "PublicDescription": "Number of SSE/AVX computational 128-bit packed single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 4 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
b74d1315SAndi Kleen        "SampleAfterValue": "2000003",
10e8d85fSIan Rogers        "UMask": "0x8"
b74d1315SAndi Kleen    },
b74d1315SAndi Kleen    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational 256-bit packed double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 4 computation operations, one for each element.  Applies to SSE* and AVX* packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element.",
10e8d85fSIan Rogers        "EventCode": "0xc7",
b74d1315SAndi Kleen        "EventName": "FP_ARITH_INST_RETIRED.256B_PACKED_DOUBLE",
*78036545SIan Rogers        "PublicDescription": "Number of SSE/AVX computational 256-bit packed double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 4 computation operations, one for each element.  Applies to SSE* and AVX* packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
b74d1315SAndi Kleen        "SampleAfterValue": "2000003",
10e8d85fSIan Rogers        "UMask": "0x10"
b74d1315SAndi Kleen    },
b74d1315SAndi Kleen    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational 256-bit packed single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 8 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element.",
b3ab8adcSAndi Kleen        "EventCode": "0xc7",
b3ab8adcSAndi Kleen        "EventName": "FP_ARITH_INST_RETIRED.256B_PACKED_SINGLE",
*78036545SIan Rogers        "PublicDescription": "Number of SSE/AVX computational 256-bit packed single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 8 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
b3ab8adcSAndi Kleen        "SampleAfterValue": "2000003",
10e8d85fSIan Rogers        "UMask": "0x20"
b3ab8adcSAndi Kleen    },
b3ab8adcSAndi Kleen    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational 128-bit packed single and 256-bit packed double precision FP instructions retired; some instructions will count twice as noted below.  Each count represents 4 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision and packed double precision FP instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX RCP14 RSQRT14 SQRT DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB count twice as they perform 2 calculations per element.",
10e8d85fSIan Rogers        "EventCode": "0xc7",
10e8d85fSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.4_FLOPS",
10e8d85fSIan Rogers        "PublicDescription": "Number of SSE/AVX computational 128-bit packed single precision and 256-bit packed double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 4 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision floating-point and packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX RCP14 RSQRT14 SQRT DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
10e8d85fSIan Rogers        "SampleAfterValue": "2000003",
b3ab8adcSAndi Kleen        "UMask": "0x18"
b3ab8adcSAndi Kleen    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational double precision floating-point instructions retired; some instructions will count twice as noted below. Applies to SSE* and AVX* scalar and packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
b3ab8adcSAndi Kleen        "EventCode": "0xc7",
b3ab8adcSAndi Kleen        "EventName": "FP_ARITH_INST_RETIRED.DOUBLE",
10e8d85fSIan Rogers        "SampleAfterValue": "2000006",
b3ab8adcSAndi Kleen        "UMask": "0x15"
b3ab8adcSAndi Kleen    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational packed floating-point instructions retired; some instructions will count twice as noted below. Applies to SSE* and AVX* packed double and single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
10e8d85fSIan Rogers        "EventCode": "0xc7",
*78036545SIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.PACKED",
10e8d85fSIan Rogers        "SampleAfterValue": "2000004",
10e8d85fSIan Rogers        "UMask": "0x3c"
b74d1315SAndi Kleen    },
b74d1315SAndi Kleen    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational scalar floating-point instructions retired; some instructions will count twice as noted below. Each count represents 1 computation operation.   Applies to SSE* and AVX* scalar double and single precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT RSQRT RCP FM(N)ADD/SUB. FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
10e8d85fSIan Rogers        "EventCode": "0xc7",
10e8d85fSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.SCALAR",
*78036545SIan Rogers        "PublicDescription": "Number of SSE/AVX computational scalar single precision and double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 1 computational operation. Applies to SSE* and AVX* scalar single precision and double precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT RSQRT RCP FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
10e8d85fSIan Rogers        "SampleAfterValue": "2000003",
10e8d85fSIan Rogers        "UMask": "0x3"
b74d1315SAndi Kleen    },
b74d1315SAndi Kleen    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational scalar double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 1 computational operation. Applies to SSE* and AVX* scalar double precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
10e8d85fSIan Rogers        "EventCode": "0xc7",
10e8d85fSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.SCALAR_DOUBLE",
*78036545SIan Rogers        "PublicDescription": "Number of SSE/AVX computational scalar double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 1 computational operation. Applies to SSE* and AVX* scalar double precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
10e8d85fSIan Rogers        "SampleAfterValue": "2000003",
10e8d85fSIan Rogers        "UMask": "0x1"
b74d1315SAndi Kleen    },
b74d1315SAndi Kleen    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational scalar single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 1 computational operation. Applies to SSE* and AVX* scalar single precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT RSQRT RCP FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
10e8d85fSIan Rogers        "EventCode": "0xc7",
10e8d85fSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.SCALAR_SINGLE",
10e8d85fSIan Rogers        "PublicDescription": "Number of SSE/AVX computational scalar single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 1 computational operation. Applies to SSE* and AVX* scalar single precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT RSQRT RCP FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
10e8d85fSIan Rogers        "SampleAfterValue": "2000003",
b74d1315SAndi Kleen        "UMask": "0x2"
b74d1315SAndi Kleen    },
10e8d85fSIan Rogers    {
b74d1315SAndi Kleen        "BriefDescription": "Number of SSE/AVX computational single precision floating-point instructions retired; some instructions will count twice as noted below. Applies to SSE* and AVX* scalar and packed single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
10e8d85fSIan Rogers        "EventCode": "0xc7",
10e8d85fSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.SINGLE",
10e8d85fSIan Rogers        "SampleAfterValue": "2000005",
10e8d85fSIan Rogers        "UMask": "0x2a"
10e8d85fSIan Rogers    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Number of any Vector retired FP arithmetic instructions",
10e8d85fSIan Rogers        "EventCode": "0xc7",
10e8d85fSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.VECTOR",
10e8d85fSIan Rogers        "SampleAfterValue": "2000003",
10e8d85fSIan Rogers        "UMask": "0xfc"
10e8d85fSIan Rogers    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Cycles with any input/output SSE or FP assist",
10e8d85fSIan Rogers        "CounterMask": "1",
10e8d85fSIan Rogers        "EventCode": "0xCA",
10e8d85fSIan Rogers        "EventName": "FP_ASSIST.ANY",
10e8d85fSIan Rogers        "PublicDescription": "This event counts cycles with any input and output SSE or x87 FP assist. If an input and output assist are detected on the same cycle the event increments by 1.",
10e8d85fSIan Rogers        "SampleAfterValue": "100003",
10e8d85fSIan Rogers        "UMask": "0x1e"
10e8d85fSIan Rogers    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SIMD FP assists due to input values",
10e8d85fSIan Rogers        "EventCode": "0xCA",
10e8d85fSIan Rogers        "EventName": "FP_ASSIST.SIMD_INPUT",
10e8d85fSIan Rogers        "PublicDescription": "This event counts any input SSE* FP assist - invalid operation, denormal operand, dividing by zero, SNaN operand. Counting includes only cases involving penalties that required micro-code assist intervention.",
10e8d85fSIan Rogers        "SampleAfterValue": "100003",
10e8d85fSIan Rogers        "UMask": "0x10"
10e8d85fSIan Rogers    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SIMD FP assists due to output values",
10e8d85fSIan Rogers        "EventCode": "0xCA",
10e8d85fSIan Rogers        "EventName": "FP_ASSIST.SIMD_OUTPUT",
10e8d85fSIan Rogers        "PublicDescription": "This event counts the number of SSE* floating point (FP) micro-code assists (numeric overflow/underflow) when the output value (destination register) is invalid. Counting covers only cases involving penalties that require micro-code assist intervention.",
10e8d85fSIan Rogers        "SampleAfterValue": "100003",
10e8d85fSIan Rogers        "UMask": "0x8"
10e8d85fSIan Rogers    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Number of X87 assists due to input value.",
10e8d85fSIan Rogers        "EventCode": "0xCA",
10e8d85fSIan Rogers        "EventName": "FP_ASSIST.X87_INPUT",
10e8d85fSIan Rogers        "PublicDescription": "This event counts x87 floating point (FP) micro-code assists (invalid operation, denormal operand, SNaN operand) when the input value (one of the source operands to an FP instruction) is invalid.",
10e8d85fSIan Rogers        "SampleAfterValue": "100003",
10e8d85fSIan Rogers        "UMask": "0x4"
10e8d85fSIan Rogers    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Number of X87 assists due to output value.",
10e8d85fSIan Rogers        "EventCode": "0xCA",
10e8d85fSIan Rogers        "EventName": "FP_ASSIST.X87_OUTPUT",
10e8d85fSIan Rogers        "PublicDescription": "This event counts the number of x87 floating point (FP) micro-code assists (numeric overflow/underflow, inexact result) when the output value (destination register) is invalid.",
10e8d85fSIan Rogers        "SampleAfterValue": "100003",
10e8d85fSIan Rogers        "UMask": "0x2"
10e8d85fSIan Rogers    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SIMD Move Elimination candidate uops that were eliminated.",
10e8d85fSIan Rogers        "EventCode": "0x58",
10e8d85fSIan Rogers        "EventName": "MOVE_ELIMINATION.SIMD_ELIMINATED",
10e8d85fSIan Rogers        "SampleAfterValue": "1000003",
10e8d85fSIan Rogers        "UMask": "0x2"
10e8d85fSIan Rogers    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Number of SIMD Move Elimination candidate uops that were not eliminated.",
10e8d85fSIan Rogers        "EventCode": "0x58",
10e8d85fSIan Rogers        "EventName": "MOVE_ELIMINATION.SIMD_NOT_ELIMINATED",
10e8d85fSIan Rogers        "SampleAfterValue": "1000003",
10e8d85fSIan Rogers        "UMask": "0x8"
10e8d85fSIan Rogers    },
10e8d85fSIan Rogers    {
10e8d85fSIan Rogers        "BriefDescription": "Number of transitions from AVX-256 to legacy SSE when penalty applicable.",
10e8d85fSIan Rogers        "Errata": "BDM30",
10e8d85fSIan Rogers        "EventCode": "0xC1",
10e8d85fSIan Rogers        "EventName": "OTHER_ASSISTS.AVX_TO_SSE",
10e8d85fSIan Rogers        "PublicDescription": "This event counts the number of transitions from AVX-256 to legacy SSE when penalty is applicable.",
10e8d85fSIan Rogers        "SampleAfterValue": "100003",
10e8d85fSIan Rogers        "UMask": "0x8"
10e8d85fSIan Rogers    },
10e8d85fSIan Rogers    {
b74d1315SAndi Kleen        "BriefDescription": "Number of transitions from SSE to AVX-256 when penalty applicable.",
b74d1315SAndi Kleen        "Errata": "BDM30",
        "EventCode": "0xC1",
        "EventName": "OTHER_ASSISTS.SSE_TO_AVX",
        "PublicDescription": "This event counts the number of transitions from legacy SSE to AVX-256 when penalty is applicable.",
        "SampleAfterValue": "100003",
        "UMask": "0x10"
    },
    {
        "BriefDescription": "Micro-op dispatches cancelled due to insufficient SIMD physical register file read ports",
        "EventCode": "0xA0",
        "EventName": "UOP_DISPATCHES_CANCELLED.SIMD_PRF",
        "PublicDescription": "This event counts the number of micro-operations cancelled after they were dispatched from the scheduler to the execution units when the total number of physical register read ports across all dispatch ports exceeds the read bandwidth of the physical register file.  The SIMD_PRF subevent applies to the following instructions: VDPPS, DPPS, VPCMPESTRI, PCMPESTRI, VPCMPESTRM, PCMPESTRM, VFMADD*, VFMADDSUB*, VFMSUB*, VFMSUBADD*, VFNMADD*, VFNMSUB*.  See the Broadwell Optimization Guide for more information.",
        "SampleAfterValue": "2000003",
        "UMask": "0x3"
    }
]