arm64: Allow hw watchpoint at varied offset from base address
authorPratyush Anand <panand@redhat.com>
Mon, 14 Nov 2016 14:02:43 +0000 (19:32 +0530)
committerWill Deacon <will.deacon@arm.com>
Fri, 18 Nov 2016 17:23:17 +0000 (17:23 +0000)
ARM64 hardware supports watchpoint at any double word aligned address.
However, it can select any consecutive bytes from offset 0 to 7 from that
base address. For example, if base address is programmed as 0x420030 and
byte select is 0x1C, then access of 0x420032,0x420033 and 0x420034 will
generate a watchpoint exception.

Currently, we do not have such modularity. We can only program byte,
halfword, word and double word access exception from any base address.

This patch adds support to overcome above limitations.

Signed-off-by: Pratyush Anand <panand@redhat.com>
Signed-off-by: Will Deacon <will.deacon@arm.com>
arch/arm64/include/asm/hw_breakpoint.h
arch/arm64/kernel/hw_breakpoint.c
arch/arm64/kernel/ptrace.c

index 9510ace570e29b1a0991bdfd04351f755a62dd69..d1c3b06ad307160c29585bd92a47ccfc70cbcfb5 100644 (file)
@@ -119,7 +119,7 @@ struct perf_event;
 struct pmu;
 
 extern int arch_bp_generic_fields(struct arch_hw_breakpoint_ctrl ctrl,
-                                 int *gen_len, int *gen_type);
+                                 int *gen_len, int *gen_type, int *offset);
 extern int arch_check_bp_in_kernelspace(struct perf_event *bp);
 extern int arch_validate_hwbkpt_settings(struct perf_event *bp);
 extern int hw_breakpoint_exceptions_notify(struct notifier_block *unused,
index 948b73148d56750be242120b5f0191b3a13ef8f3..3f7bc65e7ef614b4b64ac9aed1a0f07bc865f0c4 100644 (file)
@@ -349,7 +349,7 @@ int arch_check_bp_in_kernelspace(struct perf_event *bp)
  * to generic breakpoint descriptions.
  */
 int arch_bp_generic_fields(struct arch_hw_breakpoint_ctrl ctrl,
-                          int *gen_len, int *gen_type)
+                          int *gen_len, int *gen_type, int *offset)
 {
        /* Type */
        switch (ctrl.type) {
@@ -369,8 +369,12 @@ int arch_bp_generic_fields(struct arch_hw_breakpoint_ctrl ctrl,
                return -EINVAL;
        }
 
+       if (!ctrl.len)
+               return -EINVAL;
+       *offset = __ffs(ctrl.len);
+
        /* Len */
-       switch (ctrl.len) {
+       switch (ctrl.len >> *offset) {
        case ARM_BREAKPOINT_LEN_1:
                *gen_len = HW_BREAKPOINT_LEN_1;
                break;
@@ -517,18 +521,17 @@ int arch_validate_hwbkpt_settings(struct perf_event *bp)
                default:
                        return -EINVAL;
                }
-
-               info->address &= ~alignment_mask;
-               info->ctrl.len <<= offset;
        } else {
                if (info->ctrl.type == ARM_BREAKPOINT_EXECUTE)
                        alignment_mask = 0x3;
                else
                        alignment_mask = 0x7;
-               if (info->address & alignment_mask)
-                       return -EINVAL;
+               offset = info->address & alignment_mask;
        }
 
+       info->address &= ~alignment_mask;
+       info->ctrl.len <<= offset;
+
        /*
         * Disallow per-task kernel breakpoints since these would
         * complicate the stepping code.
@@ -665,8 +668,8 @@ static int watchpoint_handler(unsigned long addr, unsigned int esr,
                              struct pt_regs *regs)
 {
        int i, step = 0, *kernel_step, access;
-       u32 ctrl_reg;
-       u64 val, alignment_mask;
+       u32 ctrl_reg, lens, lene;
+       u64 val;
        struct perf_event *wp, **slots;
        struct debug_info *debug_info;
        struct arch_hw_breakpoint *info;
@@ -684,25 +687,21 @@ static int watchpoint_handler(unsigned long addr, unsigned int esr,
                        goto unlock;
 
                info = counter_arch_bp(wp);
-               /* AArch32 watchpoints are either 4 or 8 bytes aligned. */
-               if (is_compat_task()) {
-                       if (info->ctrl.len == ARM_BREAKPOINT_LEN_8)
-                               alignment_mask = 0x7;
-                       else
-                               alignment_mask = 0x3;
-               } else {
-                       alignment_mask = 0x7;
-               }
 
-               /* Check if the watchpoint value matches. */
+               /* Check if the watchpoint value and byte select match. */
                val = read_wb_reg(AARCH64_DBG_REG_WVR, i);
-               if (val != (addr & ~alignment_mask))
-                       goto unlock;
-
-               /* Possible match, check the byte address select to confirm. */
                ctrl_reg = read_wb_reg(AARCH64_DBG_REG_WCR, i);
                decode_ctrl_reg(ctrl_reg, &ctrl);
-               if (!((1 << (addr & alignment_mask)) & ctrl.len))
+               lens = ffs(ctrl.len) - 1;
+               lene = fls(ctrl.len) - 1;
+               /*
+                * FIXME: reported address can be anywhere between "the
+                * lowest address accessed by the memory access that
+                * triggered the watchpoint" and "the highest watchpointed
+                * address accessed by the memory access". So, it may not
+                * lie in the interval of watchpoint address range.
+                */
+               if (addr < val + lens || addr > val + lene)
                        goto unlock;
 
                /*
index e0c81da60f76270ad122fee3595464852e7d9ee2..fc35e06ccaaca863ad680ff09166c3f2ba034c54 100644 (file)
@@ -327,13 +327,13 @@ static int ptrace_hbp_fill_attr_ctrl(unsigned int note_type,
                                     struct arch_hw_breakpoint_ctrl ctrl,
                                     struct perf_event_attr *attr)
 {
-       int err, len, type, disabled = !ctrl.enabled;
+       int err, len, type, offset, disabled = !ctrl.enabled;
 
        attr->disabled = disabled;
        if (disabled)
                return 0;
 
-       err = arch_bp_generic_fields(ctrl, &len, &type);
+       err = arch_bp_generic_fields(ctrl, &len, &type, &offset);
        if (err)
                return err;
 
@@ -352,6 +352,7 @@ static int ptrace_hbp_fill_attr_ctrl(unsigned int note_type,
 
        attr->bp_len    = len;
        attr->bp_type   = type;
+       attr->bp_addr   += offset;
 
        return 0;
 }
@@ -404,7 +405,7 @@ static int ptrace_hbp_get_addr(unsigned int note_type,
        if (IS_ERR(bp))
                return PTR_ERR(bp);
 
-       *addr = bp ? bp->attr.bp_addr : 0;
+       *addr = bp ? counter_arch_bp(bp)->address : 0;
        return 0;
 }