x86/broadwellde/floating-point.json

27b565b1SAndi Kleen[
27b565b1SAndi Kleen    {
*8aae803fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational 128-bit packed double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 2 computation operations, one for each element.  Applies to SSE* and AVX* packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element.",
*8aae803fSIan Rogers        "EventCode": "0xc7",
fae0a4dfSAndi Kleen        "EventName": "FP_ARITH_INST_RETIRED.128B_PACKED_DOUBLE",
*8aae803fSIan Rogers        "PublicDescription": "Number of SSE/AVX computational 128-bit packed double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 2 computation operations, one for each element.  Applies to SSE* and AVX* packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
fae0a4dfSAndi Kleen        "SampleAfterValue": "2000003",
34cb72efSIan Rogers        "UMask": "0x4"
fae0a4dfSAndi Kleen    },
fae0a4dfSAndi Kleen    {
        "BriefDescription": "Number of SSE/AVX computational 128-bit packed single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 4 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element.",
*8aae803fSIan Rogers        "EventCode": "0xc7",
fae0a4dfSAndi Kleen        "EventName": "FP_ARITH_INST_RETIRED.128B_PACKED_SINGLE",
*8aae803fSIan Rogers        "PublicDescription": "Number of SSE/AVX computational 128-bit packed single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 4 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
fae0a4dfSAndi Kleen        "SampleAfterValue": "2000003",
34cb72efSIan Rogers        "UMask": "0x8"
fae0a4dfSAndi Kleen    },
fae0a4dfSAndi Kleen    {
        "BriefDescription": "Number of SSE/AVX computational 256-bit packed double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 4 computation operations, one for each element.  Applies to SSE* and AVX* packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element.",
*8aae803fSIan Rogers        "EventCode": "0xc7",
fae0a4dfSAndi Kleen        "EventName": "FP_ARITH_INST_RETIRED.256B_PACKED_DOUBLE",
*8aae803fSIan Rogers        "PublicDescription": "Number of SSE/AVX computational 256-bit packed double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 4 computation operations, one for each element.  Applies to SSE* and AVX* packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
fae0a4dfSAndi Kleen        "SampleAfterValue": "2000003",
34cb72efSIan Rogers        "UMask": "0x10"
fae0a4dfSAndi Kleen    },
fae0a4dfSAndi Kleen    {
        "BriefDescription": "Number of SSE/AVX computational 256-bit packed single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 8 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element.",
34cb72efSIan Rogers        "EventCode": "0xc7",
fae0a4dfSAndi Kleen        "EventName": "FP_ARITH_INST_RETIRED.256B_PACKED_SINGLE",
*8aae803fSIan Rogers        "PublicDescription": "Number of SSE/AVX computational 256-bit packed single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 8 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
fae0a4dfSAndi Kleen        "SampleAfterValue": "2000003",
34cb72efSIan Rogers        "UMask": "0x20"
27b565b1SAndi Kleen    },
27b565b1SAndi Kleen    {
*8aae803fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational 128-bit packed single and 256-bit packed double precision FP instructions retired; some instructions will count twice as noted below.  Each count represents 2 or/and 4 computation operations, 1 for each element.  Applies to SSE* and AVX* packed single precision and packed double precision FP instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX RCP14 RSQRT14 SQRT DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB count twice as they perform 2 calculations per element.",
*8aae803fSIan Rogers        "EventCode": "0xc7",
34cb72efSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.4_FLOPS",
34cb72efSIan Rogers        "PublicDescription": "Number of SSE/AVX computational 128-bit packed single precision and 256-bit packed double precision  floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 2 or/and 4 computation operations, one for each element.  Applies to SSE* and AVX* packed single precision floating-point and packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX RCP14 RSQRT14 SQRT DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
34cb72efSIan Rogers        "SampleAfterValue": "2000003",
27b565b1SAndi Kleen        "UMask": "0x18"
27b565b1SAndi Kleen    },
*8aae803fSIan Rogers    {
*8aae803fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational double precision floating-point instructions retired; some instructions will count twice as noted below. Applies to SSE* and AVX* scalar and packed double precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
fae0a4dfSAndi Kleen        "EventCode": "0xc7",
fae0a4dfSAndi Kleen        "EventName": "FP_ARITH_INST_RETIRED.DOUBLE",
34cb72efSIan Rogers        "SampleAfterValue": "2000006",
fae0a4dfSAndi Kleen        "UMask": "0x15"
fae0a4dfSAndi Kleen    },
*8aae803fSIan Rogers    {
*8aae803fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational packed floating-point instructions retired; some instructions will count twice as noted below. Applies to SSE* and AVX* packed double and single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
34cb72efSIan Rogers        "EventCode": "0xc7",
*8aae803fSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.PACKED",
34cb72efSIan Rogers        "SampleAfterValue": "2000004",
34cb72efSIan Rogers        "UMask": "0x3c"
fae0a4dfSAndi Kleen    },
fae0a4dfSAndi Kleen    {
*8aae803fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational scalar floating-point instructions retired; some instructions will count twice as noted below. Each count represents 1 computation operation.   Applies to SSE* and AVX* scalar double and single precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT RSQRT RCP FM(N)ADD/SUB. FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
*8aae803fSIan Rogers        "EventCode": "0xc7",
34cb72efSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.SCALAR",
        "PublicDescription": "Number of SSE/AVX computational scalar single precision and double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 1 computational operation. Applies to SSE* and AVX* scalar single precision and double precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT RSQRT RCP FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
34cb72efSIan Rogers        "SampleAfterValue": "2000003",
34cb72efSIan Rogers        "UMask": "0x3"
fae0a4dfSAndi Kleen    },
fae0a4dfSAndi Kleen    {
*8aae803fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational scalar double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 1 computational operation. Applies to SSE* and AVX* scalar double precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
*8aae803fSIan Rogers        "EventCode": "0xc7",
34cb72efSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.SCALAR_DOUBLE",
*8aae803fSIan Rogers        "PublicDescription": "Number of SSE/AVX computational scalar double precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 1 computational operation. Applies to SSE* and AVX* scalar double precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
34cb72efSIan Rogers        "SampleAfterValue": "2000003",
34cb72efSIan Rogers        "UMask": "0x1"
fae0a4dfSAndi Kleen    },
fae0a4dfSAndi Kleen    {
*8aae803fSIan Rogers        "BriefDescription": "Number of SSE/AVX computational scalar single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 1 computational operation. Applies to SSE* and AVX* scalar single precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT RSQRT RCP FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
*8aae803fSIan Rogers        "EventCode": "0xc7",
34cb72efSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.SCALAR_SINGLE",
34cb72efSIan Rogers        "PublicDescription": "Number of SSE/AVX computational scalar single precision floating-point instructions retired; some instructions will count twice as noted below.  Each count represents 1 computational operation. Applies to SSE* and AVX* scalar single precision floating-point instructions: ADD SUB MUL DIV MIN MAX SQRT RSQRT RCP FM(N)ADD/SUB.  FM(N)ADD/SUB instructions count twice as they perform 2 calculations per element. The DAZ and FTZ flags in the MXCSR register need to be set when using these events.",
34cb72efSIan Rogers        "SampleAfterValue": "2000003",
34cb72efSIan Rogers        "UMask": "0x2"
34cb72efSIan Rogers    },
34cb72efSIan Rogers    {
        "BriefDescription": "Number of SSE/AVX computational single precision floating-point instructions retired; some instructions will count twice as noted below. Applies to SSE* and AVX* scalar and packed single precision floating-point instructions: ADD SUB HADD HSUB SUBADD MUL DIV MIN MAX SQRT RSQRT RCP DPP FM(N)ADD/SUB.  DPP and FM(N)ADD/SUB instructions count twice as they perform multiple calculations per element.",
fae0a4dfSAndi Kleen        "EventCode": "0xc7",
34cb72efSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.SINGLE",
34cb72efSIan Rogers        "SampleAfterValue": "2000005",
34cb72efSIan Rogers        "UMask": "0x2a"
34cb72efSIan Rogers    },
34cb72efSIan Rogers    {
34cb72efSIan Rogers        "BriefDescription": "Number of any Vector retired FP arithmetic instructions",
fae0a4dfSAndi Kleen        "EventCode": "0xc7",
34cb72efSIan Rogers        "EventName": "FP_ARITH_INST_RETIRED.VECTOR",
fae0a4dfSAndi Kleen        "SampleAfterValue": "2000003",
fae0a4dfSAndi Kleen        "UMask": "0xfc"
fae0a4dfSAndi Kleen    },
34cb72efSIan Rogers    {
fae0a4dfSAndi Kleen        "BriefDescription": "Cycles with any input/output SSE or FP assist",
fae0a4dfSAndi Kleen        "CounterMask": "1",
34cb72efSIan Rogers        "EventCode": "0xCA",
34cb72efSIan Rogers        "EventName": "FP_ASSIST.ANY",
34cb72efSIan Rogers        "PublicDescription": "This event counts cycles with any input and output SSE or x87 FP assist. If an input and output assist are detected on the same cycle the event increments by 1.",
34cb72efSIan Rogers        "SampleAfterValue": "100003",
fae0a4dfSAndi Kleen        "UMask": "0x1e"
34cb72efSIan Rogers    },
34cb72efSIan Rogers    {
34cb72efSIan Rogers        "BriefDescription": "Number of SIMD FP assists due to input values",
34cb72efSIan Rogers        "EventCode": "0xCA",
34cb72efSIan Rogers        "EventName": "FP_ASSIST.SIMD_INPUT",
34cb72efSIan Rogers        "PublicDescription": "This event counts any input SSE* FP assist - invalid operation, denormal operand, dividing by zero, SNaN operand. Counting includes only cases involving penalties that required micro-code assist intervention.",
34cb72efSIan Rogers        "SampleAfterValue": "100003",
34cb72efSIan Rogers        "UMask": "0x10"
34cb72efSIan Rogers    },
34cb72efSIan Rogers    {
        "BriefDescription": "Number of SIMD FP assists due to output values",
34cb72efSIan Rogers        "EventCode": "0xCA",
34cb72efSIan Rogers        "EventName": "FP_ASSIST.SIMD_OUTPUT",
34cb72efSIan Rogers        "PublicDescription": "This event counts the number of SSE* floating point (FP) micro-code assist (numeric overflow/underflow) when the output value (destination register) is invalid. Counting covers only cases involving penalties that require micro-code assist intervention.",
34cb72efSIan Rogers        "SampleAfterValue": "100003",
34cb72efSIan Rogers        "UMask": "0x8"
34cb72efSIan Rogers    },
34cb72efSIan Rogers    {
34cb72efSIan Rogers        "BriefDescription": "Number of X87 assists due to input value.",
34cb72efSIan Rogers        "EventCode": "0xCA",
34cb72efSIan Rogers        "EventName": "FP_ASSIST.X87_INPUT",
34cb72efSIan Rogers        "PublicDescription": "This event counts x87 floating point (FP) micro-code assist (invalid operation, denormal operand, SNaN operand) when the input value (one of the source operands to an FP instruction) is invalid.",
34cb72efSIan Rogers        "SampleAfterValue": "100003",
34cb72efSIan Rogers        "UMask": "0x4"
34cb72efSIan Rogers    },
34cb72efSIan Rogers    {
34cb72efSIan Rogers        "BriefDescription": "Number of X87 assists due to output value.",
34cb72efSIan Rogers        "EventCode": "0xCA",
34cb72efSIan Rogers        "EventName": "FP_ASSIST.X87_OUTPUT",
34cb72efSIan Rogers        "PublicDescription": "This event counts the number of x87 floating point (FP) micro-code assist (numeric overflow/underflow, inexact result) when the output value (destination register) is invalid.",
34cb72efSIan Rogers        "SampleAfterValue": "100003",
34cb72efSIan Rogers        "UMask": "0x2"
34cb72efSIan Rogers    },
34cb72efSIan Rogers    {
34cb72efSIan Rogers        "BriefDescription": "Number of SIMD Move Elimination candidate uops that were eliminated.",
34cb72efSIan Rogers        "EventCode": "0x58",
34cb72efSIan Rogers        "EventName": "MOVE_ELIMINATION.SIMD_ELIMINATED",
34cb72efSIan Rogers        "SampleAfterValue": "1000003",
34cb72efSIan Rogers        "UMask": "0x2"
34cb72efSIan Rogers    },
34cb72efSIan Rogers    {
34cb72efSIan Rogers        "BriefDescription": "Number of SIMD Move Elimination candidate uops that were not eliminated.",
34cb72efSIan Rogers        "EventCode": "0x58",
34cb72efSIan Rogers        "EventName": "MOVE_ELIMINATION.SIMD_NOT_ELIMINATED",
34cb72efSIan Rogers        "SampleAfterValue": "1000003",
34cb72efSIan Rogers        "UMask": "0x8"
34cb72efSIan Rogers    },
34cb72efSIan Rogers    {
34cb72efSIan Rogers        "BriefDescription": "Number of transitions from AVX-256 to legacy SSE when penalty applicable.",
34cb72efSIan Rogers        "Errata": "BDM30",
34cb72efSIan Rogers        "EventCode": "0xC1",
34cb72efSIan Rogers        "EventName": "OTHER_ASSISTS.AVX_TO_SSE",
34cb72efSIan Rogers        "PublicDescription": "This event counts the number of transitions from AVX-256 to legacy SSE when penalty is applicable.",
34cb72efSIan Rogers        "SampleAfterValue": "100003",
34cb72efSIan Rogers        "UMask": "0x8"
34cb72efSIan Rogers    },
34cb72efSIan Rogers    {
27b565b1SAndi Kleen        "BriefDescription": "Number of transitions from SSE to AVX-256 when penalty applicable.",
27b565b1SAndi Kleen        "Errata": "BDM30",
        "EventCode": "0xC1",
        "EventName": "OTHER_ASSISTS.SSE_TO_AVX",
        "PublicDescription": "This event counts the number of transitions from legacy SSE to AVX-256 when penalty is applicable.",
        "SampleAfterValue": "100003",
        "UMask": "0x10"
    },
    {
        "BriefDescription": "Micro-op dispatches cancelled due to insufficient SIMD physical register file read ports",
        "EventCode": "0xA0",
        "EventName": "UOP_DISPATCHES_CANCELLED.SIMD_PRF",
        "PublicDescription": "This event counts the number of micro-operations cancelled after they were dispatched from the scheduler to the execution units when the total number of physical register read ports across all dispatch ports exceeds the read bandwidth of the physical register file.  The SIMD_PRF subevent applies to the following instructions: VDPPS, DPPS, VPCMPESTRI, PCMPESTRI, VPCMPESTRM, PCMPESTRM, VFMADD*, VFMADDSUB*, VFMSUB*, VFMSUBADD*, VFNMADD*, VFNMSUB*.  See the Broadwell Optimization Guide for more information.",
        "SampleAfterValue": "2000003",
        "UMask": "0x3"
    }
]