sh: perf events: Add support for SH7750-style counters.
authorPaul Mundt <lethal@linux-sh.org>
Thu, 5 Nov 2009 08:02:03 +0000 (17:02 +0900)
committerPaul Mundt <lethal@linux-sh.org>
Thu, 5 Nov 2009 08:02:03 +0000 (17:02 +0900)
This adds perf events support for the SH7750/SH7750S/SH7091 performance
counters.

Signed-off-by: Paul Mundt <lethal@linux-sh.org>
arch/sh/kernel/cpu/sh4/Makefile
arch/sh/kernel/cpu/sh4/perf_event.c [new file with mode: 0644]

index 203b18347b831e2d2b63d3b0df06f2f7d7af1b20..c39c1235db91346a0c98203eea6c99e454b92f2f 100644 (file)
@@ -9,6 +9,11 @@ obj-$(CONFIG_HIBERNATION)              += $(addprefix ../sh3/, swsusp.o)
 obj-$(CONFIG_SH_FPU)                   += fpu.o softfloat.o
 obj-$(CONFIG_SH_STORE_QUEUES)          += sq.o
 
+# Perf events
+obj-$(CONFIG_CPU_SUBTYPE_SH7750)       += perf_event.o
+obj-$(CONFIG_CPU_SUBTYPE_SH7750S)      += perf_event.o
+obj-$(CONFIG_CPU_SUBTYPE_SH7091)       += perf_event.o
+
 # CPU subtype setup
 obj-$(CONFIG_CPU_SUBTYPE_SH7750)       += setup-sh7750.o
 obj-$(CONFIG_CPU_SUBTYPE_SH7750R)      += setup-sh7750.o
diff --git a/arch/sh/kernel/cpu/sh4/perf_event.c b/arch/sh/kernel/cpu/sh4/perf_event.c
new file mode 100644 (file)
index 0000000..7f9ecc9
--- /dev/null
@@ -0,0 +1,253 @@
+/*
+ * Performance events support for SH7750-style performance counters
+ *
+ *  Copyright (C) 2009  Paul Mundt
+ *
+ * This file is subject to the terms and conditions of the GNU General Public
+ * License.  See the file "COPYING" in the main directory of this archive
+ * for more details.
+ */
+#include <linux/kernel.h>
+#include <linux/init.h>
+#include <linux/io.h>
+#include <linux/irq.h>
+#include <linux/perf_event.h>
+#include <asm/processor.h>
+
+#define PM_CR_BASE     0xff000084      /* 16-bit */
+#define PM_CTR_BASE    0xff100004      /* 32-bit */
+
+#define PMCR(n)                (PM_CR_BASE + ((n) * 0x04))
+#define PMCTRH(n)      (PM_CTR_BASE + 0x00 + ((n) * 0x08))
+#define PMCTRL(n)      (PM_CTR_BASE + 0x04 + ((n) * 0x08))
+
+#define PMCR_PMM_MASK  0x0000003f
+
+#define PMCR_CLKF      0x00000100
+#define PMCR_PMCLR     0x00002000
+#define PMCR_PMST      0x00004000
+#define PMCR_PMEN      0x00008000
+
+static struct sh_pmu sh7750_pmu;
+
+/*
+ * There are a number of events supported by each counter (33 in total).
+ * Since we have 2 counters, each counter will take the event code as it
+ * corresponds to the PMCR PMM setting. Each counter can be configured
+ * independently.
+ *
+ *     Event Code      Description
+ *     ----------      -----------
+ *
+ *     0x01            Operand read access
+ *     0x02            Operand write access
+ *     0x03            UTLB miss
+ *     0x04            Operand cache read miss
+ *     0x05            Operand cache write miss
+ *     0x06            Instruction fetch (w/ cache)
+ *     0x07            Instruction TLB miss
+ *     0x08            Instruction cache miss
+ *     0x09            All operand accesses
+ *     0x0a            All instruction accesses
+ *     0x0b            OC RAM operand access
+ *     0x0d            On-chip I/O space access
+ *     0x0e            Operand access (r/w)
+ *     0x0f            Operand cache miss (r/w)
+ *     0x10            Branch instruction
+ *     0x11            Branch taken
+ *     0x12            BSR/BSRF/JSR
+ *     0x13            Instruction execution
+ *     0x14            Instruction execution in parallel
+ *     0x15            FPU Instruction execution
+ *     0x16            Interrupt
+ *     0x17            NMI
+ *     0x18            trapa instruction execution
+ *     0x19            UBCA match
+ *     0x1a            UBCB match
+ *     0x21            Instruction cache fill
+ *     0x22            Operand cache fill
+ *     0x23            Elapsed time
+ *     0x24            Pipeline freeze by I-cache miss
+ *     0x25            Pipeline freeze by D-cache miss
+ *     0x27            Pipeline freeze by branch instruction
+ *     0x28            Pipeline freeze by CPU register
+ *     0x29            Pipeline freeze by FPU
+ */
+
+static const int sh7750_general_events[] = {
+       [PERF_COUNT_HW_CPU_CYCLES]              = 0x0023,
+       [PERF_COUNT_HW_INSTRUCTIONS]            = 0x000a,
+       [PERF_COUNT_HW_CACHE_REFERENCES]        = 0x0006,       /* I-cache */
+       [PERF_COUNT_HW_CACHE_MISSES]            = 0x0008,       /* I-cache */
+       [PERF_COUNT_HW_BRANCH_INSTRUCTIONS]     = 0x0010,
+       [PERF_COUNT_HW_BRANCH_MISSES]           = -1,
+       [PERF_COUNT_HW_BUS_CYCLES]              = -1,
+};
+
+#define C(x)   PERF_COUNT_HW_CACHE_##x
+
+static const int sh7750_cache_events
+                       [PERF_COUNT_HW_CACHE_MAX]
+                       [PERF_COUNT_HW_CACHE_OP_MAX]
+                       [PERF_COUNT_HW_CACHE_RESULT_MAX] =
+{
+       [ C(L1D) ] = {
+               [ C(OP_READ) ] = {
+                       [ C(RESULT_ACCESS) ] = 0x0001,
+                       [ C(RESULT_MISS)   ] = 0x0004,
+               },
+               [ C(OP_WRITE) ] = {
+                       [ C(RESULT_ACCESS) ] = 0x0002,
+                       [ C(RESULT_MISS)   ] = 0x0005,
+               },
+               [ C(OP_PREFETCH) ] = {
+                       [ C(RESULT_ACCESS) ] = 0,
+                       [ C(RESULT_MISS)   ] = 0,
+               },
+       },
+
+       [ C(L1I) ] = {
+               [ C(OP_READ) ] = {
+                       [ C(RESULT_ACCESS) ] = 0x0006,
+                       [ C(RESULT_MISS)   ] = 0x0008,
+               },
+               [ C(OP_WRITE) ] = {
+                       [ C(RESULT_ACCESS) ] = -1,
+                       [ C(RESULT_MISS)   ] = -1,
+               },
+               [ C(OP_PREFETCH) ] = {
+                       [ C(RESULT_ACCESS) ] = 0,
+                       [ C(RESULT_MISS)   ] = 0,
+               },
+       },
+
+       [ C(LL) ] = {
+               [ C(OP_READ) ] = {
+                       [ C(RESULT_ACCESS) ] = 0,
+                       [ C(RESULT_MISS)   ] = 0,
+               },
+               [ C(OP_WRITE) ] = {
+                       [ C(RESULT_ACCESS) ] = 0,
+                       [ C(RESULT_MISS)   ] = 0,
+               },
+               [ C(OP_PREFETCH) ] = {
+                       [ C(RESULT_ACCESS) ] = 0,
+                       [ C(RESULT_MISS)   ] = 0,
+               },
+       },
+
+       [ C(DTLB) ] = {
+               [ C(OP_READ) ] = {
+                       [ C(RESULT_ACCESS) ] = 0,
+                       [ C(RESULT_MISS)   ] = 0x0003,
+               },
+               [ C(OP_WRITE) ] = {
+                       [ C(RESULT_ACCESS) ] = 0,
+                       [ C(RESULT_MISS)   ] = 0,
+               },
+               [ C(OP_PREFETCH) ] = {
+                       [ C(RESULT_ACCESS) ] = 0,
+                       [ C(RESULT_MISS)   ] = 0,
+               },
+       },
+
+       [ C(ITLB) ] = {
+               [ C(OP_READ) ] = {
+                       [ C(RESULT_ACCESS) ] = 0,
+                       [ C(RESULT_MISS)   ] = 0x0007,
+               },
+               [ C(OP_WRITE) ] = {
+                       [ C(RESULT_ACCESS) ] = -1,
+                       [ C(RESULT_MISS)   ] = -1,
+               },
+               [ C(OP_PREFETCH) ] = {
+                       [ C(RESULT_ACCESS) ] = -1,
+                       [ C(RESULT_MISS)   ] = -1,
+               },
+       },
+
+       [ C(BPU) ] = {
+               [ C(OP_READ) ] = {
+                       [ C(RESULT_ACCESS) ] = -1,
+                       [ C(RESULT_MISS)   ] = -1,
+               },
+               [ C(OP_WRITE) ] = {
+                       [ C(RESULT_ACCESS) ] = -1,
+                       [ C(RESULT_MISS)   ] = -1,
+               },
+               [ C(OP_PREFETCH) ] = {
+                       [ C(RESULT_ACCESS) ] = -1,
+                       [ C(RESULT_MISS)   ] = -1,
+               },
+       },
+};
+
+static int sh7750_event_map(int event)
+{
+       return sh7750_general_events[event];
+}
+
+static u64 sh7750_pmu_read(int idx)
+{
+       return (u64)((u64)(__raw_readl(PMCTRH(idx)) & 0xffff) << 32) |
+                          __raw_readl(PMCTRL(idx));
+}
+
+static void sh7750_pmu_disable(struct hw_perf_event *hwc, int idx)
+{
+       unsigned int tmp;
+
+       tmp = __raw_readw(PMCR(idx));
+       tmp &= ~(PMCR_PMM_MASK | PMCR_PMEN);
+       __raw_writew(tmp, PMCR(idx));
+}
+
+static void sh7750_pmu_enable(struct hw_perf_event *hwc, int idx)
+{
+       __raw_writew(__raw_readw(PMCR(idx)) | PMCR_PMCLR, PMCR(idx));
+       __raw_writew(hwc->config | PMCR_PMEN | PMCR_PMST, PMCR(idx));
+}
+
+static void sh7750_pmu_disable_all(void)
+{
+       int i;
+
+       for (i = 0; i < sh7750_pmu.num_events; i++)
+               __raw_writew(__raw_readw(PMCR(i)) & ~PMCR_PMEN, PMCR(i));
+}
+
+static void sh7750_pmu_enable_all(void)
+{
+       int i;
+
+       for (i = 0; i < sh7750_pmu.num_events; i++)
+               __raw_writew(__raw_readw(PMCR(i)) | PMCR_PMEN, PMCR(i));
+}
+
+static struct sh_pmu sh7750_pmu = {
+       .name           = "SH7750",
+       .num_events     = 2,
+       .event_map      = sh7750_event_map,
+       .max_events     = ARRAY_SIZE(sh7750_general_events),
+       .raw_event_mask = PMCR_PMM_MASK,
+       .cache_events   = &sh7750_cache_events,
+       .read           = sh7750_pmu_read,
+       .disable        = sh7750_pmu_disable,
+       .enable         = sh7750_pmu_enable,
+       .disable_all    = sh7750_pmu_disable_all,
+       .enable_all     = sh7750_pmu_enable_all,
+};
+
+static int __init sh7750_pmu_init(void)
+{
+       /*
+        * Make sure this CPU actually has perf counters.
+        */
+       if (!(boot_cpu_data.flags & CPU_HAS_PERF_COUNTER)) {
+               pr_notice("HW perf events unsupported, software events only.\n");
+               return -ENODEV;
+       }
+
+       return register_sh_pmu(&sh7750_pmu);
+}
+arch_initcall(sh7750_pmu_init);