perf vendor events: Update Intel sandybridge

author Ian Rogers <irogers@google.com>
Wed, 27 Jul 2022 22:08:23 +0000 (15:08 -0700)

committer Arnaldo Carvalho de Melo <acme@redhat.com>
Thu, 28 Jul 2022 19:09:58 +0000 (16:09 -0300)

diff --git a/tools/perf/pmu-events/arch/x86/mapfile.csv b/tools/perf/pmu-events/arch/x86/mapfile.csv

index 2f9419ee2d296283aef70956c8b38b11a6cf262c..0b56c4a8a3a8df93308fdb171716dedcf3e38e46 100644 (file)
--- a/tools/perf/pmu-events/arch/x86/mapfile.csv
+++ b/tools/perf/pmu-events/arch/x86/mapfile.csv
@@ -19,12 +19,12 @@ GenuineIntel-6-(57|85),v9,knightslanding,core
  GenuineIntel-6-AA,v1.00,meteorlake,core
  GenuineIntel-6-1[AEF],v3,nehalemep,core
  GenuineIntel-6-2E,v3,nehalemex,core
+GenuineIntel-6-2A,v17,sandybridge,core
  GenuineIntel-6-[4589]E,v24,skylake,core
  GenuineIntel-6-A[56],v24,skylake,core
  GenuineIntel-6-37,v13,silvermont,core
  GenuineIntel-6-4D,v13,silvermont,core
  GenuineIntel-6-4C,v13,silvermont,core
-GenuineIntel-6-2A,v15,sandybridge,core
  GenuineIntel-6-2C,v2,westmereep-dp,core
  GenuineIntel-6-25,v2,westmereep-sp,core
  GenuineIntel-6-2F,v2,westmereex,core
diff --git a/tools/perf/pmu-events/arch/x86/sandybridge/cache.json b/tools/perf/pmu-events/arch/x86/sandybridge/cache.json

index 92a7269eb4442d7d9d7fedfafca81f8ed57ad4b4..a1d6223521311a624ebf996604efd7b480f5fced 100644 (file)
--- a/tools/perf/pmu-events/arch/x86/sandybridge/cache.json
+++ b/tools/perf/pmu-events/arch/x86/sandybridge/cache.json
@@ -1876,4 +1876,4 @@
          "SampleAfterValue": "100003",
          "UMask": "0x10"
      }
-]
-\ No newline at end of file
+]
diff --git a/tools/perf/pmu-events/arch/x86/sandybridge/floating-point.json b/tools/perf/pmu-events/arch/x86/sandybridge/floating-point.json

index 713878fd062b8e1173dbee7c27689487476e1fd4..eb2ff2cfdf6b0b7971d0a0097d9a51d92409877c 100644 (file)
--- a/tools/perf/pmu-events/arch/x86/sandybridge/floating-point.json
+++ b/tools/perf/pmu-events/arch/x86/sandybridge/floating-point.json
@@ -135,4 +135,4 @@
          "SampleAfterValue": "2000003",
          "UMask": "0x1"
      }
-]
-\ No newline at end of file
+]
diff --git a/tools/perf/pmu-events/arch/x86/sandybridge/frontend.json b/tools/perf/pmu-events/arch/x86/sandybridge/frontend.json

index fa22f9463b66c88b2d644ecdecc928619dc33847..e2c82e43a2deb91abd6d3b896e95348e11010840 100644 (file)
--- a/tools/perf/pmu-events/arch/x86/sandybridge/frontend.json
+++ b/tools/perf/pmu-events/arch/x86/sandybridge/frontend.json
@@ -176,7 +176,7 @@
          "CounterMask": "1",
          "EventCode": "0x79",
          "EventName": "IDQ.MS_CYCLES",
-        "PublicDescription": "This event counts cycles during which the microcode sequencer assisted the front-end in delivering uops.  Microcode assists are used for complex instructions or scenarios that can't be handled by the standard decoder.  Using other instructions, if possible, will usually improve performance.  See the Intel 64 and IA-32 Architectures Optimization Reference Manual for more information.",
+        "PublicDescription": "This event counts cycles during which the microcode sequencer assisted the front-end in delivering uops.  Microcode assists are used for complex instructions or scenarios that can't be handled by the standard decoder.  Using other instructions, if possible, will usually improve performance.  See the Intel(R) 64 and IA-32 Architectures Optimization Reference Manual for more information.",
          "SampleAfterValue": "2000003",
          "UMask": "0x30"
      },
@@ -311,4 +311,4 @@
          "SampleAfterValue": "2000003",
          "UMask": "0x1"
      }
-]
-\ No newline at end of file
+]
diff --git a/tools/perf/pmu-events/arch/x86/sandybridge/memory.json b/tools/perf/pmu-events/arch/x86/sandybridge/memory.json

index 931892d34076bc6f31022810743f166582c8896f..3c283ca309f357981911112637bd74ef69c4a332 100644 (file)
--- a/tools/perf/pmu-events/arch/x86/sandybridge/memory.json
+++ b/tools/perf/pmu-events/arch/x86/sandybridge/memory.json
@@ -442,4 +442,4 @@
          "SampleAfterValue": "100003",
          "UMask": "0x1"
      }
-]
-\ No newline at end of file
+]
diff --git a/tools/perf/pmu-events/arch/x86/sandybridge/other.json b/tools/perf/pmu-events/arch/x86/sandybridge/other.json

index e251f535ec092217215492f5b2f5b63f3a15541a..2f873ab14156b769e00c4e19a57727ca10376fc5 100644 (file)
--- a/tools/perf/pmu-events/arch/x86/sandybridge/other.json
+++ b/tools/perf/pmu-events/arch/x86/sandybridge/other.json
@@ -55,4 +55,4 @@
          "SampleAfterValue": "2000003",
          "UMask": "0x1"
      }
-]
-\ No newline at end of file
+]
diff --git a/tools/perf/pmu-events/arch/x86/sandybridge/pipeline.json b/tools/perf/pmu-events/arch/x86/sandybridge/pipeline.json

index b9a3f194a00a8173faece3d77cc5db3ff10bf0a8..2c3b6c92aa6b742cfb4399a21c806ac270903078 100644 (file)
--- a/tools/perf/pmu-events/arch/x86/sandybridge/pipeline.json
+++ b/tools/perf/pmu-events/arch/x86/sandybridge/pipeline.json
@@ -609,7 +609,7 @@
          "UMask": "0x3"
      },
      {
-        "BriefDescription": "Number of occurences waiting for the checkpoints in Resource Allocation Table (RAT) to be recovered after Nuke due to all other cases except JEClear (e.g. whenever a ucode assist is needed like SSE exception, memory disambiguation, etc...).",
+        "BriefDescription": "Number of occurrences waiting for the checkpoints in Resource Allocation Table (RAT) to be recovered after Nuke due to all other cases except JEClear (e.g. whenever a ucode assist is needed like SSE exception, memory disambiguation, etc...).",
          "Counter": "0,1,2,3",
          "CounterHTOff": "0,1,2,3,4,5,6,7",
          "CounterMask": "1",
@@ -652,7 +652,7 @@
          "CounterHTOff": "0,1,2,3,4,5,6,7",
          "EventCode": "0x03",
          "EventName": "LD_BLOCKS.STORE_FORWARD",
-        "PublicDescription": "This event counts loads that followed a store to the same address, where the data could not be forwarded inside the pipeline from the store to the load.  The most common reason why store forwarding would be blocked is when a load's address range overlaps with a preceeding smaller uncompleted store.  See the table of not supported store forwards in the Intel 64 and IA-32 Architectures Optimization Reference Manual.  The penalty for blocked store forwarding is that the load must wait for the store to complete before it can be issued.",
+        "PublicDescription": "This event counts loads that followed a store to the same address, where the data could not be forwarded inside the pipeline from the store to the load.  The most common reason why store forwarding would be blocked is when a load's address range overlaps with a preceeding smaller uncompleted store.  See the table of not supported store forwards in the Intel(R) 64 and IA-32 Architectures Optimization Reference Manual.  The penalty for blocked store forwarding is that the load must wait for the store to complete before it can be issued.",
          "SampleAfterValue": "100003",
          "UMask": "0x2"
      },
@@ -778,7 +778,7 @@
          "CounterMask": "1",
          "EventCode": "0x59",
          "EventName": "PARTIAL_RAT_STALLS.FLAGS_MERGE_UOP_CYCLES",
-        "PublicDescription": "This event counts the number of cycles spent executing performance-sensitive flags-merging uops. For example, shift CL (merge_arith_flags). For more details, See the Intel 64 and IA-32 Architectures Optimization Reference Manual.",
+        "PublicDescription": "This event counts the number of cycles spent executing performance-sensitive flags-merging uops. For example, shift CL (merge_arith_flags). For more details, See the Intel(R) 64 and IA-32 Architectures Optimization Reference Manual.",
          "SampleAfterValue": "2000003",
          "UMask": "0x20"
      },
@@ -797,7 +797,7 @@
          "CounterHTOff": "0,1,2,3,4,5,6,7",
          "EventCode": "0x59",
          "EventName": "PARTIAL_RAT_STALLS.SLOW_LEA_WINDOW",
-        "PublicDescription": "This event counts the number of cycles with at least one slow LEA uop being allocated. A uop is generally considered as slow LEA if it has three sources (for example, two sources and immediate) regardless of whether it is a result of LEA instruction or not. Examples of the slow LEA uop are or uops with base, index, and offset source operands using base and index reqisters, where base is EBR/RBP/R13, using RIP relative or 16-bit addressing modes. See the Intel 64 and IA-32 Architectures Optimization Reference Manual for more details about slow LEA instructions.",
+        "PublicDescription": "This event counts the number of cycles with at least one slow LEA uop being allocated. A uop is generally considered as slow LEA if it has three sources (for example, two sources and immediate) regardless of whether it is a result of LEA instruction or not. Examples of the slow LEA uop are or uops with base, index, and offset source operands using base and index reqisters, where base is EBR/RBP/R13, using RIP relative or 16-bit addressing modes. See the Intel(R) 64 and IA-32 Architectures Optimization Reference Manual for more details about slow LEA instructions.",
          "SampleAfterValue": "2000003",
          "UMask": "0x40"
      },
@@ -1209,4 +1209,4 @@
          "SampleAfterValue": "2000003",
          "UMask": "0x1"
      }
-]
-\ No newline at end of file
+]
diff --git a/tools/perf/pmu-events/arch/x86/sandybridge/snb-metrics.json b/tools/perf/pmu-events/arch/x86/sandybridge/snb-metrics.json

index c8e7050d9c2668f8abf7b2d98c48b571cebe01ef..ae7ed267b2a2226036c80cce9c2147ac69771606 100644 (file)
--- a/tools/perf/pmu-events/arch/x86/sandybridge/snb-metrics.json
+++ b/tools/perf/pmu-events/arch/x86/sandybridge/snb-metrics.json
@@ -124,7 +124,7 @@
          "MetricName": "FLOPc_SMT"
      },
      {
-        "BriefDescription": "Instruction-Level-Parallelism (average number of uops executed when there is at least 1 uop executed)",
+        "BriefDescription": "Instruction-Level-Parallelism (average number of uops executed when there is execution) per-core",
          "MetricExpr": "UOPS_DISPATCHED.THREAD / (( cpu@UOPS_DISPATCHED.CORE\\,cmask\\=1@ / 2 ) if #SMT_on else cpu@UOPS_DISPATCHED.CORE\\,cmask\\=1@)",
          "MetricGroup": "Backend;Cor;Pipeline;PortsUtil",
          "MetricName": "ILP"
@@ -141,6 +141,12 @@
          "MetricGroup": "Summary;TmaL1",
          "MetricName": "Instructions"
      },
+    {
+        "BriefDescription": "Average number of Uops retired in cycles where at least one uop has retired.",
+        "MetricExpr": "UOPS_RETIRED.RETIRE_SLOTS / cpu@UOPS_RETIRED.RETIRE_SLOTS\\,cmask\\=1@",
+        "MetricGroup": "Pipeline;Ret",
+        "MetricName": "Retire"
+    },
      {
          "BriefDescription": "Fraction of Uops delivered by the DSB (aka Decoded ICache; or Uop Cache)",
          "MetricExpr": "IDQ.DSB_UOPS / (( IDQ.DSB_UOPS + LSD.UOPS + IDQ.MITE_UOPS + IDQ.MS_UOPS ) )",
@@ -163,7 +169,8 @@
          "BriefDescription": "Giga Floating Point Operations Per Second",
          "MetricExpr": "( ( 1 * ( FP_COMP_OPS_EXE.SSE_SCALAR_SINGLE + FP_COMP_OPS_EXE.SSE_SCALAR_DOUBLE ) + 2 * FP_COMP_OPS_EXE.SSE_PACKED_DOUBLE + 4 * ( FP_COMP_OPS_EXE.SSE_PACKED_SINGLE + SIMD_FP_256.PACKED_DOUBLE ) + 8 * SIMD_FP_256.PACKED_SINGLE ) / 1000000000 ) / duration_time",
          "MetricGroup": "Cor;Flops;HPC",
-        "MetricName": "GFLOPs"
+        "MetricName": "GFLOPs",
+        "PublicDescription": "Giga Floating Point Operations Per Second. Aggregate across all supported options of: FP precisions, scalar and vector instructions, vector-width and AMX engine."
      },
      {
          "BriefDescription": "Average Frequency Utilization relative nominal frequency",
diff --git a/tools/perf/pmu-events/arch/x86/sandybridge/uncore-other.json b/tools/perf/pmu-events/arch/x86/sandybridge/uncore-other.json

index 6278068908cf8f7a0b43890bb66055482eed0558..88f1e326205fa5426dc6e6f586f71aaab78d5516 100644 (file)
--- a/tools/perf/pmu-events/arch/x86/sandybridge/uncore-other.json
+++ b/tools/perf/pmu-events/arch/x86/sandybridge/uncore-other.json
@@ -82,10 +82,10 @@
      {
          "BriefDescription": "This 48-bit fixed counter counts the UCLK cycles.",
          "Counter": "Fixed",
+        "EventCode": "0xff",
          "EventName": "UNC_CLOCK.SOCKET",
          "PerPkg": "1",
          "PublicDescription": "This 48-bit fixed counter counts the UCLK cycles.",
-        "UMask": "0x01",
          "Unit": "ARB"
      }
  ]
diff --git a/tools/perf/pmu-events/arch/x86/sandybridge/virtual-memory.json b/tools/perf/pmu-events/arch/x86/sandybridge/virtual-memory.json

index 4dd136d00a10b8ecd43a8fd3c080253bad9b592a..98362abba1a7d7347cf029c23d24bbed602b7c01 100644 (file)
--- a/tools/perf/pmu-events/arch/x86/sandybridge/virtual-memory.json
+++ b/tools/perf/pmu-events/arch/x86/sandybridge/virtual-memory.json
@@ -146,4 +146,4 @@
          "SampleAfterValue": "100007",
          "UMask": "0x20"
      }
-]
-\ No newline at end of file
+]
Files changed in this commit:
tools/perf/pmu-events/arch/x86/mapfile.csv
tools/perf/pmu-events/arch/x86/sandybridge/cache.json
tools/perf/pmu-events/arch/x86/sandybridge/floating-point.json
tools/perf/pmu-events/arch/x86/sandybridge/frontend.json
tools/perf/pmu-events/arch/x86/sandybridge/memory.json
tools/perf/pmu-events/arch/x86/sandybridge/other.json
tools/perf/pmu-events/arch/x86/sandybridge/pipeline.json
tools/perf/pmu-events/arch/x86/sandybridge/snb-metrics.json
tools/perf/pmu-events/arch/x86/sandybridge/uncore-other.json
tools/perf/pmu-events/arch/x86/sandybridge/virtual-memory.json