BACKPORT: arm64: hw_breakpoint: Handle inexact watchpoint addresses
authorPavel Labath <test.tberghammer@gmail.com>
Mon, 14 Nov 2016 14:02:44 +0000 (19:32 +0530)
committerAmit Pundir <amit.pundir@linaro.org>
Mon, 10 Apr 2017 07:42:16 +0000 (13:12 +0530)
(cherry picked from commit fdfeff0f9e3d9be2b68fa02566017ffc581ae17b)

Arm64 hardware does not always report a watchpoint hit address that
matches one of the watchpoints set. It can also report an address
"near" the watchpoint if a single instruction access both watched and
unwatched addresses. There is no straight-forward way, short of
disassembling the offending instruction, to map that address back to
the watchpoint.

Previously, when the hardware reported a watchpoint hit on an address
that did not match our watchpoint (this happens in case of instructions
which access large chunks of memory such as "stp") the process would
enter a loop where we would be continually resuming it (because we did
not recognise that watchpoint hit) and it would keep hitting the
watchpoint again and again. The tracing process would never get
notified of the watchpoint hit.

This commit fixes the problem by looking at the watchpoints near the
address reported by the hardware. If the address does not exactly match
one of the watchpoints we have set, it attributes the hit to the
nearest watchpoint we have.  This heuristic is a bit dodgy, but I don't
think we can do much more, given the hardware limitations.

Signed-off-by: Pavel Labath <labath@google.com>
[panand: reworked to rebase on his patches]
Signed-off-by: Pratyush Anand <panand@redhat.com>
[will: use __ffs instead of ffs - 1]
Signed-off-by: Will Deacon <will.deacon@arm.com>
Signed-off-by: Pavel Labath <labath@google.com>
[pavel: trivial fixup in hw_breakpoint.c:watchpoint_handler]
Change-Id: I714dfaa3947d89d89a9e9a1ea84914d44ba0faa3
Bug: 30919905

arch/arm64/kernel/hw_breakpoint.c

index 1f4fc5364a472e44f9368d46719015f7fe767f6b..3730b1fb3344f32dfffce987b275f8f4a9563aa4 100644 (file)
@@ -664,11 +664,46 @@ unlock:
 }
 NOKPROBE_SYMBOL(breakpoint_handler);
 
+/*
+ * Arm64 hardware does not always report a watchpoint hit address that matches
+ * one of the watchpoints set. It can also report an address "near" the
+ * watchpoint if a single instruction access both watched and unwatched
+ * addresses. There is no straight-forward way, short of disassembling the
+ * offending instruction, to map that address back to the watchpoint. This
+ * function computes the distance of the memory access from the watchpoint as a
+ * heuristic for the likelyhood that a given access triggered the watchpoint.
+ *
+ * See Section D2.10.5 "Determining the memory location that caused a Watchpoint
+ * exception" of ARMv8 Architecture Reference Manual for details.
+ *
+ * The function returns the distance of the address from the bytes watched by
+ * the watchpoint. In case of an exact match, it returns 0.
+ */
+static u64 get_distance_from_watchpoint(unsigned long addr, u64 val,
+                                       struct arch_hw_breakpoint_ctrl *ctrl)
+{
+       u64 wp_low, wp_high;
+       u32 lens, lene;
+
+       lens = __ffs(ctrl->len);
+       lene = __fls(ctrl->len);
+
+       wp_low = val + lens;
+       wp_high = val + lene;
+       if (addr < wp_low)
+               return wp_low - addr;
+       else if (addr > wp_high)
+               return addr - wp_high;
+       else
+               return 0;
+}
+
 static int watchpoint_handler(unsigned long addr, unsigned int esr,
                              struct pt_regs *regs)
 {
-       int i, step = 0, *kernel_step, access;
-       u32 ctrl_reg, lens, lene;
+       int i, step = 0, *kernel_step, access, closest_match = 0;
+       u64 min_dist = -1, dist;
+       u32 ctrl_reg;
        u64 val;
        struct perf_event *wp, **slots;
        struct debug_info *debug_info;
@@ -678,31 +713,15 @@ static int watchpoint_handler(unsigned long addr, unsigned int esr,
        slots = this_cpu_ptr(wp_on_reg);
        debug_info = &current->thread.debug;
 
+       /*
+        * Find all watchpoints that match the reported address. If no exact
+        * match is found. Attribute the hit to the closest watchpoint.
+        */
+       rcu_read_lock();
        for (i = 0; i < core_num_wrps; ++i) {
-               rcu_read_lock();
-
                wp = slots[i];
-
                if (wp == NULL)
-                       goto unlock;
-
-               info = counter_arch_bp(wp);
-
-               /* Check if the watchpoint value and byte select match. */
-               val = read_wb_reg(AARCH64_DBG_REG_WVR, i);
-               ctrl_reg = read_wb_reg(AARCH64_DBG_REG_WCR, i);
-               decode_ctrl_reg(ctrl_reg, &ctrl);
-               lens = ffs(ctrl.len) - 1;
-               lene = fls(ctrl.len) - 1;
-               /*
-                * FIXME: reported address can be anywhere between "the
-                * lowest address accessed by the memory access that
-                * triggered the watchpoint" and "the highest watchpointed
-                * address accessed by the memory access". So, it may not
-                * lie in the interval of watchpoint address range.
-                */
-               if (addr < val + lens || addr > val + lene)
-                       goto unlock;
+                       continue;
 
                /*
                 * Check that the access type matches.
@@ -711,18 +730,41 @@ static int watchpoint_handler(unsigned long addr, unsigned int esr,
                access = (esr & AARCH64_ESR_ACCESS_MASK) ? HW_BREAKPOINT_W :
                         HW_BREAKPOINT_R;
                if (!(access & hw_breakpoint_type(wp)))
-                       goto unlock;
+                       continue;
 
+               /* Check if the watchpoint value and byte select match. */
+               val = read_wb_reg(AARCH64_DBG_REG_WVR, i);
+               ctrl_reg = read_wb_reg(AARCH64_DBG_REG_WCR, i);
+               decode_ctrl_reg(ctrl_reg, &ctrl);
+               dist = get_distance_from_watchpoint(addr, val, &ctrl);
+               if (dist < min_dist) {
+                       min_dist = dist;
+                       closest_match = i;
+               }
+               /* Is this an exact match? */
+               if (dist != 0)
+                       continue;
+
+               info = counter_arch_bp(wp);
                info->trigger = addr;
                perf_bp_event(wp, regs);
 
                /* Do we need to handle the stepping? */
                if (!wp->overflow_handler)
                        step = 1;
+       }
+       if (min_dist > 0 && min_dist != -1) {
+               /* No exact match found. */
+               wp = slots[closest_match];
+               info = counter_arch_bp(wp);
+               info->trigger = addr;
+               perf_bp_event(wp, regs);
 
-unlock:
-               rcu_read_unlock();
+               /* Do we need to handle the stepping? */
+               if (!wp->overflow_handler)
+                       step = 1;
        }
+       rcu_read_unlock();
 
        if (!step)
                return 0;