Commit 4c290d4f authored by Thomas Richter, committed by Arnaldo Carvalho de Melo
Browse files

perf vendor events s390: Add metric for TLB and cache

Add metrics for TLB and cache statistics:

- finite_cpi: Cycles per Instructions from Finite cache/memory
- est_cpi: Estimated Instruction Complexity CPI infinite Level 1
- scpl1m: Estimated Sourcing Cycles per Level 1 Miss
- tlb_percent: Estimated TLB CPU percentage of Total CPU
- tlb_miss: Estimated Cycles per TLB Miss
- pte_miss: Page Table Entry misses (added to only one of the four metric files)

For details about the formulas see this documentation:

  https://www.ibm.com/support/pages/system/files/inline-files/CPU%20MF%20Formulas%20including%20z16%20-%20May%202022_1.pdf



Output after:

  # ./perf stat -M tlb_miss -- dd if=/dev/zero of=/dev/null bs=1M count=10K
  ... dd output removed

  Performance counter stats for 'dd if=/dev/zero of=/dev/null bs=1M count=10K':

           667,726      DTLB2_MISSES             #   440.96 tlb_miss
               198      ITLB2_WRITES
       795,170,260      L1C_TLB2_MISSES
             9,478      ITLB2_MISSES
               820      DTLB2_WRITES
     1,197,126,869      L1D_PENALTY_CYCLES
         2,457,447      L1I_PENALTY_CYCLES

       1.249342187 seconds time elapsed

       0.001030000 seconds user
       1.248105000 seconds sys

  #

Signed-off-by: Thomas Richter <tmricht@linux.ibm.com>
Acked-by: Ian Rogers <irogers@google.com>
Acked-by: Sumanth Korikkar <sumanthk@linux.ibm.com>
Cc: Heiko Carstens <hca@linux.ibm.com>
Cc: Sven Schnelle <svens@linux.ibm.com>
Cc: Vasily Gorbik <gor@linux.ibm.com>
Link: https://lore.kernel.org/r/20230313080201.2440201-3-tmricht@linux.ibm.com


Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
parent 850eea23
Loading
Loading
Loading
Loading
+30 −0
Original line number Diff line number Diff line
@@ -43,5 +43,35 @@
    "BriefDescription": "Percentage sourced from memory",
    "MetricName": "memp",
    "MetricExpr": "((L1D_ONNODE_MEM_SOURCED_WRITES + L1D_ONDRAWER_MEM_SOURCED_WRITES + L1D_OFFDRAWER_MEM_SOURCED_WRITES + L1D_ONCHIP_MEM_SOURCED_WRITES + L1I_ONNODE_MEM_SOURCED_WRITES + L1I_ONDRAWER_MEM_SOURCED_WRITES + L1I_OFFDRAWER_MEM_SOURCED_WRITES + L1I_ONCHIP_MEM_SOURCED_WRITES) / (L1I_DIR_WRITES + L1D_DIR_WRITES)) * 100"
  },
  {
    "BriefDescription": "Cycles per Instructions from Finite cache/memory",
    "MetricName": "finite_cpi",
    "MetricExpr": "L1C_TLB1_MISSES / INSTRUCTIONS"
  },
  {
    "BriefDescription": "Estimated Instruction Complexity CPI infinite Level 1",
    "MetricName": "est_cpi",
    "MetricExpr": "(CPU_CYCLES / INSTRUCTIONS) - (L1C_TLB1_MISSES / INSTRUCTIONS)"
  },
  {
    "BriefDescription": "Estimated Sourcing Cycles per Level 1 Miss",
    "MetricName": "scpl1m",
    "MetricExpr": "L1C_TLB1_MISSES / (L1I_DIR_WRITES + L1D_DIR_WRITES)"
  },
  {
    "BriefDescription": "Estimated TLB CPU percentage of Total CPU",
    "MetricName": "tlb_percent",
    "MetricExpr": "((DTLB1_MISSES + ITLB1_MISSES) / CPU_CYCLES) * (L1C_TLB1_MISSES / (L1I_PENALTY_CYCLES + L1D_PENALTY_CYCLES)) * 100"
  },
  {
    "BriefDescription": "Estimated Cycles per TLB Miss",
    "MetricName": "tlb_miss",
    "MetricExpr": "((DTLB1_MISSES + ITLB1_MISSES) / (DTLB1_WRITES + ITLB1_WRITES)) * (L1C_TLB1_MISSES / (L1I_PENALTY_CYCLES + L1D_PENALTY_CYCLES))"
  },
  {
    "BriefDescription": "Page Table Entry misses",
    "MetricName": "pte_miss",
    "MetricExpr": "(TLB2_PTE_WRITES / (DTLB1_WRITES + ITLB1_WRITES)) * 100"
  }
]
+25 −0
Original line number Diff line number Diff line
@@ -43,5 +43,30 @@
    "BriefDescription": "Percentage sourced from memory",
    "MetricName": "memp",
    "MetricExpr": "((L1D_ONCHIP_MEMORY_SOURCED_WRITES + L1D_ONCLUSTER_MEMORY_SOURCED_WRITES + L1D_OFFCLUSTER_MEMORY_SOURCED_WRITES + L1D_OFFDRAWER_MEMORY_SOURCED_WRITES + L1I_ONCHIP_MEMORY_SOURCED_WRITES + L1I_ONCLUSTER_MEMORY_SOURCED_WRITES + L1I_OFFCLUSTER_MEMORY_SOURCED_WRITES + L1I_OFFDRAWER_MEMORY_SOURCED_WRITES) / (L1I_DIR_WRITES + L1D_DIR_WRITES)) * 100"
  },
  {
    "BriefDescription": "Cycles per Instructions from Finite cache/memory",
    "MetricName": "finite_cpi",
    "MetricExpr": "L1C_TLB2_MISSES / INSTRUCTIONS"
  },
  {
    "BriefDescription": "Estimated Instruction Complexity CPI infinite Level 1",
    "MetricName": "est_cpi",
    "MetricExpr": "(CPU_CYCLES / INSTRUCTIONS) - (L1C_TLB2_MISSES / INSTRUCTIONS)"
  },
  {
    "BriefDescription": "Estimated Sourcing Cycles per Level 1 Miss",
    "MetricName": "scpl1m",
    "MetricExpr": "L1C_TLB2_MISSES / (L1I_DIR_WRITES + L1D_DIR_WRITES)"
  },
  {
    "BriefDescription": "Estimated TLB CPU percentage of Total CPU",
    "MetricName": "tlb_percent",
    "MetricExpr": "((DTLB2_MISSES + ITLB2_MISSES) / CPU_CYCLES) * (L1C_TLB2_MISSES / (L1I_PENALTY_CYCLES + L1D_PENALTY_CYCLES)) * 100"
  },
  {
    "BriefDescription": "Estimated Cycles per TLB Miss",
    "MetricName": "tlb_miss",
    "MetricExpr": "((DTLB2_MISSES + ITLB2_MISSES) / (DTLB2_WRITES + ITLB2_WRITES)) * (L1C_TLB2_MISSES / (L1I_PENALTY_CYCLES + L1D_PENALTY_CYCLES))"
  }
]
+25 −0
Original line number Diff line number Diff line
@@ -43,5 +43,30 @@
    "BriefDescription": "Percentage sourced from memory",
    "MetricName": "memp",
    "MetricExpr": "((L1D_ONCHIP_MEMORY_SOURCED_WRITES + L1D_ONCLUSTER_MEMORY_SOURCED_WRITES + L1D_OFFCLUSTER_MEMORY_SOURCED_WRITES + L1D_OFFDRAWER_MEMORY_SOURCED_WRITES + L1I_ONCHIP_MEMORY_SOURCED_WRITES + L1I_ONCLUSTER_MEMORY_SOURCED_WRITES + L1I_OFFCLUSTER_MEMORY_SOURCED_WRITES + L1I_OFFDRAWER_MEMORY_SOURCED_WRITES) / (L1I_DIR_WRITES + L1D_DIR_WRITES)) * 100"
  },
  {
    "BriefDescription": "Cycles per Instructions from Finite cache/memory",
    "MetricName": "finite_cpi",
    "MetricExpr": "L1C_TLB2_MISSES / INSTRUCTIONS"
  },
  {
    "BriefDescription": "Estimated Instruction Complexity CPI infinite Level 1",
    "MetricName": "est_cpi",
    "MetricExpr": "(CPU_CYCLES / INSTRUCTIONS) - (L1C_TLB2_MISSES / INSTRUCTIONS)"
  },
  {
    "BriefDescription": "Estimated Sourcing Cycles per Level 1 Miss",
    "MetricName": "scpl1m",
    "MetricExpr": "L1C_TLB2_MISSES / (L1I_DIR_WRITES + L1D_DIR_WRITES)"
  },
  {
    "BriefDescription": "Estimated TLB CPU percentage of Total CPU",
    "MetricName": "tlb_percent",
    "MetricExpr": "((DTLB2_MISSES + ITLB2_MISSES) / CPU_CYCLES) * (L1C_TLB2_MISSES / (L1I_PENALTY_CYCLES + L1D_PENALTY_CYCLES)) * 100"
  },
  {
    "BriefDescription": "Estimated Cycles per TLB Miss",
    "MetricName": "tlb_miss",
    "MetricExpr": "((DTLB2_MISSES + ITLB2_MISSES) / (DTLB2_WRITES + ITLB2_WRITES)) * (L1C_TLB2_MISSES / (L1I_PENALTY_CYCLES + L1D_PENALTY_CYCLES))"
  }
]
+25 −0
Original line number Diff line number Diff line
@@ -43,5 +43,30 @@
    "BriefDescription": "Percentage sourced from memory",
    "MetricName": "memp",
    "MetricExpr": "((DCW_ON_CHIP_MEMORY + DCW_ON_MODULE_MEMORY + DCW_ON_DRAWER_MEMORY + DCW_OFF_DRAWER_MEMORY + ICW_ON_CHIP_MEMORY + ICW_ON_MODULE_MEMORY + ICW_ON_DRAWER_MEMORY + ICW_OFF_DRAWER_MEMORY) / (L1I_DIR_WRITES + L1D_DIR_WRITES)) * 100"
  },
  {
    "BriefDescription": "Cycles per Instructions from Finite cache/memory",
    "MetricName": "finite_cpi",
    "MetricExpr": "L1C_TLB2_MISSES / INSTRUCTIONS"
  },
  {
    "BriefDescription": "Estimated Instruction Complexity CPI infinite Level 1",
    "MetricName": "est_cpi",
    "MetricExpr": "(CPU_CYCLES / INSTRUCTIONS) - (L1C_TLB2_MISSES / INSTRUCTIONS)"
  },
  {
    "BriefDescription": "Estimated Sourcing Cycles per Level 1 Miss",
    "MetricName": "scpl1m",
    "MetricExpr": "L1C_TLB2_MISSES / (L1I_DIR_WRITES + L1D_DIR_WRITES)"
  },
  {
    "BriefDescription": "Estimated TLB CPU percentage of Total CPU",
    "MetricName": "tlb_percent",
    "MetricExpr": "((DTLB2_MISSES + ITLB2_MISSES) / CPU_CYCLES) * (L1C_TLB2_MISSES / (L1I_PENALTY_CYCLES + L1D_PENALTY_CYCLES)) * 100"
  },
  {
    "BriefDescription": "Estimated Cycles per TLB Miss",
    "MetricName": "tlb_miss",
    "MetricExpr": "((DTLB2_MISSES + ITLB2_MISSES) / (DTLB2_WRITES + ITLB2_WRITES)) * (L1C_TLB2_MISSES / (L1I_PENALTY_CYCLES + L1D_PENALTY_CYCLES))"
  }
]