GNU Linux-libre 4.19.295-gnu1
[releases.git] / arch / arm64 / kernel / hw_breakpoint.c
1 /*
2  * HW_breakpoint: a unified kernel/user-space hardware breakpoint facility,
3  * using the CPU's debug registers.
4  *
5  * Copyright (C) 2012 ARM Limited
6  * Author: Will Deacon <will.deacon@arm.com>
7  *
8  * This program is free software; you can redistribute it and/or modify
9  * it under the terms of the GNU General Public License version 2 as
10  * published by the Free Software Foundation.
11  *
12  * This program is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15  * GNU General Public License for more details.
16  *
17  * You should have received a copy of the GNU General Public License
18  * along with this program.  If not, see <http://www.gnu.org/licenses/>.
19  */
20
21 #define pr_fmt(fmt) "hw-breakpoint: " fmt
22
23 #include <linux/compat.h>
24 #include <linux/cpu_pm.h>
25 #include <linux/errno.h>
26 #include <linux/hw_breakpoint.h>
27 #include <linux/kprobes.h>
28 #include <linux/perf_event.h>
29 #include <linux/ptrace.h>
30 #include <linux/smp.h>
31 #include <linux/uaccess.h>
32
33 #include <asm/current.h>
34 #include <asm/debug-monitors.h>
35 #include <asm/hw_breakpoint.h>
36 #include <asm/traps.h>
37 #include <asm/cputype.h>
38 #include <asm/system_misc.h>
39
40 /* Breakpoint currently in use for each BRP. */
41 static DEFINE_PER_CPU(struct perf_event *, bp_on_reg[ARM_MAX_BRP]);
42
43 /* Watchpoint currently in use for each WRP. */
44 static DEFINE_PER_CPU(struct perf_event *, wp_on_reg[ARM_MAX_WRP]);
45
46 /* Currently stepping a per-CPU kernel breakpoint. */
47 static DEFINE_PER_CPU(int, stepping_kernel_bp);
48
49 /* Number of BRP/WRP registers on this CPU. */
50 static int core_num_brps;
51 static int core_num_wrps;
52
53 int hw_breakpoint_slots(int type)
54 {
55         /*
56          * We can be called early, so don't rely on
57          * our static variables being initialised.
58          */
59         switch (type) {
60         case TYPE_INST:
61                 return get_num_brps();
62         case TYPE_DATA:
63                 return get_num_wrps();
64         default:
65                 pr_warning("unknown slot type: %d\n", type);
66                 return 0;
67         }
68 }
69
70 #define READ_WB_REG_CASE(OFF, N, REG, VAL)      \
71         case (OFF + N):                         \
72                 AARCH64_DBG_READ(N, REG, VAL);  \
73                 break
74
75 #define WRITE_WB_REG_CASE(OFF, N, REG, VAL)     \
76         case (OFF + N):                         \
77                 AARCH64_DBG_WRITE(N, REG, VAL); \
78                 break
79
80 #define GEN_READ_WB_REG_CASES(OFF, REG, VAL)    \
81         READ_WB_REG_CASE(OFF,  0, REG, VAL);    \
82         READ_WB_REG_CASE(OFF,  1, REG, VAL);    \
83         READ_WB_REG_CASE(OFF,  2, REG, VAL);    \
84         READ_WB_REG_CASE(OFF,  3, REG, VAL);    \
85         READ_WB_REG_CASE(OFF,  4, REG, VAL);    \
86         READ_WB_REG_CASE(OFF,  5, REG, VAL);    \
87         READ_WB_REG_CASE(OFF,  6, REG, VAL);    \
88         READ_WB_REG_CASE(OFF,  7, REG, VAL);    \
89         READ_WB_REG_CASE(OFF,  8, REG, VAL);    \
90         READ_WB_REG_CASE(OFF,  9, REG, VAL);    \
91         READ_WB_REG_CASE(OFF, 10, REG, VAL);    \
92         READ_WB_REG_CASE(OFF, 11, REG, VAL);    \
93         READ_WB_REG_CASE(OFF, 12, REG, VAL);    \
94         READ_WB_REG_CASE(OFF, 13, REG, VAL);    \
95         READ_WB_REG_CASE(OFF, 14, REG, VAL);    \
96         READ_WB_REG_CASE(OFF, 15, REG, VAL)
97
98 #define GEN_WRITE_WB_REG_CASES(OFF, REG, VAL)   \
99         WRITE_WB_REG_CASE(OFF,  0, REG, VAL);   \
100         WRITE_WB_REG_CASE(OFF,  1, REG, VAL);   \
101         WRITE_WB_REG_CASE(OFF,  2, REG, VAL);   \
102         WRITE_WB_REG_CASE(OFF,  3, REG, VAL);   \
103         WRITE_WB_REG_CASE(OFF,  4, REG, VAL);   \
104         WRITE_WB_REG_CASE(OFF,  5, REG, VAL);   \
105         WRITE_WB_REG_CASE(OFF,  6, REG, VAL);   \
106         WRITE_WB_REG_CASE(OFF,  7, REG, VAL);   \
107         WRITE_WB_REG_CASE(OFF,  8, REG, VAL);   \
108         WRITE_WB_REG_CASE(OFF,  9, REG, VAL);   \
109         WRITE_WB_REG_CASE(OFF, 10, REG, VAL);   \
110         WRITE_WB_REG_CASE(OFF, 11, REG, VAL);   \
111         WRITE_WB_REG_CASE(OFF, 12, REG, VAL);   \
112         WRITE_WB_REG_CASE(OFF, 13, REG, VAL);   \
113         WRITE_WB_REG_CASE(OFF, 14, REG, VAL);   \
114         WRITE_WB_REG_CASE(OFF, 15, REG, VAL)
115
116 static u64 read_wb_reg(int reg, int n)
117 {
118         u64 val = 0;
119
120         switch (reg + n) {
121         GEN_READ_WB_REG_CASES(AARCH64_DBG_REG_BVR, AARCH64_DBG_REG_NAME_BVR, val);
122         GEN_READ_WB_REG_CASES(AARCH64_DBG_REG_BCR, AARCH64_DBG_REG_NAME_BCR, val);
123         GEN_READ_WB_REG_CASES(AARCH64_DBG_REG_WVR, AARCH64_DBG_REG_NAME_WVR, val);
124         GEN_READ_WB_REG_CASES(AARCH64_DBG_REG_WCR, AARCH64_DBG_REG_NAME_WCR, val);
125         default:
126                 pr_warning("attempt to read from unknown breakpoint register %d\n", n);
127         }
128
129         return val;
130 }
131 NOKPROBE_SYMBOL(read_wb_reg);
132
133 static void write_wb_reg(int reg, int n, u64 val)
134 {
135         switch (reg + n) {
136         GEN_WRITE_WB_REG_CASES(AARCH64_DBG_REG_BVR, AARCH64_DBG_REG_NAME_BVR, val);
137         GEN_WRITE_WB_REG_CASES(AARCH64_DBG_REG_BCR, AARCH64_DBG_REG_NAME_BCR, val);
138         GEN_WRITE_WB_REG_CASES(AARCH64_DBG_REG_WVR, AARCH64_DBG_REG_NAME_WVR, val);
139         GEN_WRITE_WB_REG_CASES(AARCH64_DBG_REG_WCR, AARCH64_DBG_REG_NAME_WCR, val);
140         default:
141                 pr_warning("attempt to write to unknown breakpoint register %d\n", n);
142         }
143         isb();
144 }
145 NOKPROBE_SYMBOL(write_wb_reg);
146
147 /*
148  * Convert a breakpoint privilege level to the corresponding exception
149  * level.
150  */
151 static enum dbg_active_el debug_exception_level(int privilege)
152 {
153         switch (privilege) {
154         case AARCH64_BREAKPOINT_EL0:
155                 return DBG_ACTIVE_EL0;
156         case AARCH64_BREAKPOINT_EL1:
157                 return DBG_ACTIVE_EL1;
158         default:
159                 pr_warning("invalid breakpoint privilege level %d\n", privilege);
160                 return -EINVAL;
161         }
162 }
163 NOKPROBE_SYMBOL(debug_exception_level);
164
165 enum hw_breakpoint_ops {
166         HW_BREAKPOINT_INSTALL,
167         HW_BREAKPOINT_UNINSTALL,
168         HW_BREAKPOINT_RESTORE
169 };
170
171 static int is_compat_bp(struct perf_event *bp)
172 {
173         struct task_struct *tsk = bp->hw.target;
174
175         /*
176          * tsk can be NULL for per-cpu (non-ptrace) breakpoints.
177          * In this case, use the native interface, since we don't have
178          * the notion of a "compat CPU" and could end up relying on
179          * deprecated behaviour if we use unaligned watchpoints in
180          * AArch64 state.
181          */
182         return tsk && is_compat_thread(task_thread_info(tsk));
183 }
184
185 /**
186  * hw_breakpoint_slot_setup - Find and setup a perf slot according to
187  *                            operations
188  *
189  * @slots: pointer to array of slots
190  * @max_slots: max number of slots
191  * @bp: perf_event to setup
192  * @ops: operation to be carried out on the slot
193  *
194  * Return:
195  *      slot index on success
196  *      -ENOSPC if no slot is available/matches
197  *      -EINVAL on wrong operations parameter
198  */
199 static int hw_breakpoint_slot_setup(struct perf_event **slots, int max_slots,
200                                     struct perf_event *bp,
201                                     enum hw_breakpoint_ops ops)
202 {
203         int i;
204         struct perf_event **slot;
205
206         for (i = 0; i < max_slots; ++i) {
207                 slot = &slots[i];
208                 switch (ops) {
209                 case HW_BREAKPOINT_INSTALL:
210                         if (!*slot) {
211                                 *slot = bp;
212                                 return i;
213                         }
214                         break;
215                 case HW_BREAKPOINT_UNINSTALL:
216                         if (*slot == bp) {
217                                 *slot = NULL;
218                                 return i;
219                         }
220                         break;
221                 case HW_BREAKPOINT_RESTORE:
222                         if (*slot == bp)
223                                 return i;
224                         break;
225                 default:
226                         pr_warn_once("Unhandled hw breakpoint ops %d\n", ops);
227                         return -EINVAL;
228                 }
229         }
230         return -ENOSPC;
231 }
232
233 static int hw_breakpoint_control(struct perf_event *bp,
234                                  enum hw_breakpoint_ops ops)
235 {
236         struct arch_hw_breakpoint *info = counter_arch_bp(bp);
237         struct perf_event **slots;
238         struct debug_info *debug_info = &current->thread.debug;
239         int i, max_slots, ctrl_reg, val_reg, reg_enable;
240         enum dbg_active_el dbg_el = debug_exception_level(info->ctrl.privilege);
241         u32 ctrl;
242
243         if (info->ctrl.type == ARM_BREAKPOINT_EXECUTE) {
244                 /* Breakpoint */
245                 ctrl_reg = AARCH64_DBG_REG_BCR;
246                 val_reg = AARCH64_DBG_REG_BVR;
247                 slots = this_cpu_ptr(bp_on_reg);
248                 max_slots = core_num_brps;
249                 reg_enable = !debug_info->bps_disabled;
250         } else {
251                 /* Watchpoint */
252                 ctrl_reg = AARCH64_DBG_REG_WCR;
253                 val_reg = AARCH64_DBG_REG_WVR;
254                 slots = this_cpu_ptr(wp_on_reg);
255                 max_slots = core_num_wrps;
256                 reg_enable = !debug_info->wps_disabled;
257         }
258
259         i = hw_breakpoint_slot_setup(slots, max_slots, bp, ops);
260
261         if (WARN_ONCE(i < 0, "Can't find any breakpoint slot"))
262                 return i;
263
264         switch (ops) {
265         case HW_BREAKPOINT_INSTALL:
266                 /*
267                  * Ensure debug monitors are enabled at the correct exception
268                  * level.
269                  */
270                 enable_debug_monitors(dbg_el);
271                 /* Fall through */
272         case HW_BREAKPOINT_RESTORE:
273                 /* Setup the address register. */
274                 write_wb_reg(val_reg, i, info->address);
275
276                 /* Setup the control register. */
277                 ctrl = encode_ctrl_reg(info->ctrl);
278                 write_wb_reg(ctrl_reg, i,
279                              reg_enable ? ctrl | 0x1 : ctrl & ~0x1);
280                 break;
281         case HW_BREAKPOINT_UNINSTALL:
282                 /* Reset the control register. */
283                 write_wb_reg(ctrl_reg, i, 0);
284
285                 /*
286                  * Release the debug monitors for the correct exception
287                  * level.
288                  */
289                 disable_debug_monitors(dbg_el);
290                 break;
291         }
292
293         return 0;
294 }
295
296 /*
297  * Install a perf counter breakpoint.
298  */
299 int arch_install_hw_breakpoint(struct perf_event *bp)
300 {
301         return hw_breakpoint_control(bp, HW_BREAKPOINT_INSTALL);
302 }
303
304 void arch_uninstall_hw_breakpoint(struct perf_event *bp)
305 {
306         hw_breakpoint_control(bp, HW_BREAKPOINT_UNINSTALL);
307 }
308
309 static int get_hbp_len(u8 hbp_len)
310 {
311         unsigned int len_in_bytes = 0;
312
313         switch (hbp_len) {
314         case ARM_BREAKPOINT_LEN_1:
315                 len_in_bytes = 1;
316                 break;
317         case ARM_BREAKPOINT_LEN_2:
318                 len_in_bytes = 2;
319                 break;
320         case ARM_BREAKPOINT_LEN_3:
321                 len_in_bytes = 3;
322                 break;
323         case ARM_BREAKPOINT_LEN_4:
324                 len_in_bytes = 4;
325                 break;
326         case ARM_BREAKPOINT_LEN_5:
327                 len_in_bytes = 5;
328                 break;
329         case ARM_BREAKPOINT_LEN_6:
330                 len_in_bytes = 6;
331                 break;
332         case ARM_BREAKPOINT_LEN_7:
333                 len_in_bytes = 7;
334                 break;
335         case ARM_BREAKPOINT_LEN_8:
336                 len_in_bytes = 8;
337                 break;
338         }
339
340         return len_in_bytes;
341 }
342
343 /*
344  * Check whether bp virtual address is in kernel space.
345  */
346 int arch_check_bp_in_kernelspace(struct arch_hw_breakpoint *hw)
347 {
348         unsigned int len;
349         unsigned long va;
350
351         va = hw->address;
352         len = get_hbp_len(hw->ctrl.len);
353
354         return (va >= TASK_SIZE) && ((va + len - 1) >= TASK_SIZE);
355 }
356
357 /*
358  * Extract generic type and length encodings from an arch_hw_breakpoint_ctrl.
359  * Hopefully this will disappear when ptrace can bypass the conversion
360  * to generic breakpoint descriptions.
361  */
362 int arch_bp_generic_fields(struct arch_hw_breakpoint_ctrl ctrl,
363                            int *gen_len, int *gen_type, int *offset)
364 {
365         /* Type */
366         switch (ctrl.type) {
367         case ARM_BREAKPOINT_EXECUTE:
368                 *gen_type = HW_BREAKPOINT_X;
369                 break;
370         case ARM_BREAKPOINT_LOAD:
371                 *gen_type = HW_BREAKPOINT_R;
372                 break;
373         case ARM_BREAKPOINT_STORE:
374                 *gen_type = HW_BREAKPOINT_W;
375                 break;
376         case ARM_BREAKPOINT_LOAD | ARM_BREAKPOINT_STORE:
377                 *gen_type = HW_BREAKPOINT_RW;
378                 break;
379         default:
380                 return -EINVAL;
381         }
382
383         if (!ctrl.len)
384                 return -EINVAL;
385         *offset = __ffs(ctrl.len);
386
387         /* Len */
388         switch (ctrl.len >> *offset) {
389         case ARM_BREAKPOINT_LEN_1:
390                 *gen_len = HW_BREAKPOINT_LEN_1;
391                 break;
392         case ARM_BREAKPOINT_LEN_2:
393                 *gen_len = HW_BREAKPOINT_LEN_2;
394                 break;
395         case ARM_BREAKPOINT_LEN_3:
396                 *gen_len = HW_BREAKPOINT_LEN_3;
397                 break;
398         case ARM_BREAKPOINT_LEN_4:
399                 *gen_len = HW_BREAKPOINT_LEN_4;
400                 break;
401         case ARM_BREAKPOINT_LEN_5:
402                 *gen_len = HW_BREAKPOINT_LEN_5;
403                 break;
404         case ARM_BREAKPOINT_LEN_6:
405                 *gen_len = HW_BREAKPOINT_LEN_6;
406                 break;
407         case ARM_BREAKPOINT_LEN_7:
408                 *gen_len = HW_BREAKPOINT_LEN_7;
409                 break;
410         case ARM_BREAKPOINT_LEN_8:
411                 *gen_len = HW_BREAKPOINT_LEN_8;
412                 break;
413         default:
414                 return -EINVAL;
415         }
416
417         return 0;
418 }
419
420 /*
421  * Construct an arch_hw_breakpoint from a perf_event.
422  */
423 static int arch_build_bp_info(struct perf_event *bp,
424                               const struct perf_event_attr *attr,
425                               struct arch_hw_breakpoint *hw)
426 {
427         /* Type */
428         switch (attr->bp_type) {
429         case HW_BREAKPOINT_X:
430                 hw->ctrl.type = ARM_BREAKPOINT_EXECUTE;
431                 break;
432         case HW_BREAKPOINT_R:
433                 hw->ctrl.type = ARM_BREAKPOINT_LOAD;
434                 break;
435         case HW_BREAKPOINT_W:
436                 hw->ctrl.type = ARM_BREAKPOINT_STORE;
437                 break;
438         case HW_BREAKPOINT_RW:
439                 hw->ctrl.type = ARM_BREAKPOINT_LOAD | ARM_BREAKPOINT_STORE;
440                 break;
441         default:
442                 return -EINVAL;
443         }
444
445         /* Len */
446         switch (attr->bp_len) {
447         case HW_BREAKPOINT_LEN_1:
448                 hw->ctrl.len = ARM_BREAKPOINT_LEN_1;
449                 break;
450         case HW_BREAKPOINT_LEN_2:
451                 hw->ctrl.len = ARM_BREAKPOINT_LEN_2;
452                 break;
453         case HW_BREAKPOINT_LEN_3:
454                 hw->ctrl.len = ARM_BREAKPOINT_LEN_3;
455                 break;
456         case HW_BREAKPOINT_LEN_4:
457                 hw->ctrl.len = ARM_BREAKPOINT_LEN_4;
458                 break;
459         case HW_BREAKPOINT_LEN_5:
460                 hw->ctrl.len = ARM_BREAKPOINT_LEN_5;
461                 break;
462         case HW_BREAKPOINT_LEN_6:
463                 hw->ctrl.len = ARM_BREAKPOINT_LEN_6;
464                 break;
465         case HW_BREAKPOINT_LEN_7:
466                 hw->ctrl.len = ARM_BREAKPOINT_LEN_7;
467                 break;
468         case HW_BREAKPOINT_LEN_8:
469                 hw->ctrl.len = ARM_BREAKPOINT_LEN_8;
470                 break;
471         default:
472                 return -EINVAL;
473         }
474
475         /*
476          * On AArch64, we only permit breakpoints of length 4, whereas
477          * AArch32 also requires breakpoints of length 2 for Thumb.
478          * Watchpoints can be of length 1, 2, 4 or 8 bytes.
479          */
480         if (hw->ctrl.type == ARM_BREAKPOINT_EXECUTE) {
481                 if (is_compat_bp(bp)) {
482                         if (hw->ctrl.len != ARM_BREAKPOINT_LEN_2 &&
483                             hw->ctrl.len != ARM_BREAKPOINT_LEN_4)
484                                 return -EINVAL;
485                 } else if (hw->ctrl.len != ARM_BREAKPOINT_LEN_4) {
486                         /*
487                          * FIXME: Some tools (I'm looking at you perf) assume
488                          *        that breakpoints should be sizeof(long). This
489                          *        is nonsense. For now, we fix up the parameter
490                          *        but we should probably return -EINVAL instead.
491                          */
492                         hw->ctrl.len = ARM_BREAKPOINT_LEN_4;
493                 }
494         }
495
496         /* Address */
497         hw->address = attr->bp_addr;
498
499         /*
500          * Privilege
501          * Note that we disallow combined EL0/EL1 breakpoints because
502          * that would complicate the stepping code.
503          */
504         if (arch_check_bp_in_kernelspace(hw))
505                 hw->ctrl.privilege = AARCH64_BREAKPOINT_EL1;
506         else
507                 hw->ctrl.privilege = AARCH64_BREAKPOINT_EL0;
508
509         /* Enabled? */
510         hw->ctrl.enabled = !attr->disabled;
511
512         return 0;
513 }
514
515 /*
516  * Validate the arch-specific HW Breakpoint register settings.
517  */
518 int hw_breakpoint_arch_parse(struct perf_event *bp,
519                              const struct perf_event_attr *attr,
520                              struct arch_hw_breakpoint *hw)
521 {
522         int ret;
523         u64 alignment_mask, offset;
524
525         /* Build the arch_hw_breakpoint. */
526         ret = arch_build_bp_info(bp, attr, hw);
527         if (ret)
528                 return ret;
529
530         /*
531          * Check address alignment.
532          * We don't do any clever alignment correction for watchpoints
533          * because using 64-bit unaligned addresses is deprecated for
534          * AArch64.
535          *
536          * AArch32 tasks expect some simple alignment fixups, so emulate
537          * that here.
538          */
539         if (is_compat_bp(bp)) {
540                 if (hw->ctrl.len == ARM_BREAKPOINT_LEN_8)
541                         alignment_mask = 0x7;
542                 else
543                         alignment_mask = 0x3;
544                 offset = hw->address & alignment_mask;
545                 switch (offset) {
546                 case 0:
547                         /* Aligned */
548                         break;
549                 case 1:
550                 case 2:
551                         /* Allow halfword watchpoints and breakpoints. */
552                         if (hw->ctrl.len == ARM_BREAKPOINT_LEN_2)
553                                 break;
554                 case 3:
555                         /* Allow single byte watchpoint. */
556                         if (hw->ctrl.len == ARM_BREAKPOINT_LEN_1)
557                                 break;
558                 default:
559                         return -EINVAL;
560                 }
561         } else {
562                 if (hw->ctrl.type == ARM_BREAKPOINT_EXECUTE)
563                         alignment_mask = 0x3;
564                 else
565                         alignment_mask = 0x7;
566                 offset = hw->address & alignment_mask;
567         }
568
569         hw->address &= ~alignment_mask;
570         hw->ctrl.len <<= offset;
571
572         /*
573          * Disallow per-task kernel breakpoints since these would
574          * complicate the stepping code.
575          */
576         if (hw->ctrl.privilege == AARCH64_BREAKPOINT_EL1 && bp->hw.target)
577                 return -EINVAL;
578
579         return 0;
580 }
581
582 /*
583  * Enable/disable all of the breakpoints active at the specified
584  * exception level at the register level.
585  * This is used when single-stepping after a breakpoint exception.
586  */
587 static void toggle_bp_registers(int reg, enum dbg_active_el el, int enable)
588 {
589         int i, max_slots, privilege;
590         u32 ctrl;
591         struct perf_event **slots;
592
593         switch (reg) {
594         case AARCH64_DBG_REG_BCR:
595                 slots = this_cpu_ptr(bp_on_reg);
596                 max_slots = core_num_brps;
597                 break;
598         case AARCH64_DBG_REG_WCR:
599                 slots = this_cpu_ptr(wp_on_reg);
600                 max_slots = core_num_wrps;
601                 break;
602         default:
603                 return;
604         }
605
606         for (i = 0; i < max_slots; ++i) {
607                 if (!slots[i])
608                         continue;
609
610                 privilege = counter_arch_bp(slots[i])->ctrl.privilege;
611                 if (debug_exception_level(privilege) != el)
612                         continue;
613
614                 ctrl = read_wb_reg(reg, i);
615                 if (enable)
616                         ctrl |= 0x1;
617                 else
618                         ctrl &= ~0x1;
619                 write_wb_reg(reg, i, ctrl);
620         }
621 }
622 NOKPROBE_SYMBOL(toggle_bp_registers);
623
624 /*
625  * Debug exception handlers.
626  */
627 static int breakpoint_handler(unsigned long unused, unsigned int esr,
628                               struct pt_regs *regs)
629 {
630         int i, step = 0, *kernel_step;
631         u32 ctrl_reg;
632         u64 addr, val;
633         struct perf_event *bp, **slots;
634         struct debug_info *debug_info;
635         struct arch_hw_breakpoint_ctrl ctrl;
636
637         slots = this_cpu_ptr(bp_on_reg);
638         addr = instruction_pointer(regs);
639         debug_info = &current->thread.debug;
640
641         for (i = 0; i < core_num_brps; ++i) {
642                 rcu_read_lock();
643
644                 bp = slots[i];
645
646                 if (bp == NULL)
647                         goto unlock;
648
649                 /* Check if the breakpoint value matches. */
650                 val = read_wb_reg(AARCH64_DBG_REG_BVR, i);
651                 if (val != (addr & ~0x3))
652                         goto unlock;
653
654                 /* Possible match, check the byte address select to confirm. */
655                 ctrl_reg = read_wb_reg(AARCH64_DBG_REG_BCR, i);
656                 decode_ctrl_reg(ctrl_reg, &ctrl);
657                 if (!((1 << (addr & 0x3)) & ctrl.len))
658                         goto unlock;
659
660                 counter_arch_bp(bp)->trigger = addr;
661                 perf_bp_event(bp, regs);
662
663                 /* Do we need to handle the stepping? */
664                 if (uses_default_overflow_handler(bp))
665                         step = 1;
666 unlock:
667                 rcu_read_unlock();
668         }
669
670         if (!step)
671                 return 0;
672
673         if (user_mode(regs)) {
674                 debug_info->bps_disabled = 1;
675                 toggle_bp_registers(AARCH64_DBG_REG_BCR, DBG_ACTIVE_EL0, 0);
676
677                 /* If we're already stepping a watchpoint, just return. */
678                 if (debug_info->wps_disabled)
679                         return 0;
680
681                 if (test_thread_flag(TIF_SINGLESTEP))
682                         debug_info->suspended_step = 1;
683                 else
684                         user_enable_single_step(current);
685         } else {
686                 toggle_bp_registers(AARCH64_DBG_REG_BCR, DBG_ACTIVE_EL1, 0);
687                 kernel_step = this_cpu_ptr(&stepping_kernel_bp);
688
689                 if (*kernel_step != ARM_KERNEL_STEP_NONE)
690                         return 0;
691
692                 if (kernel_active_single_step()) {
693                         *kernel_step = ARM_KERNEL_STEP_SUSPEND;
694                 } else {
695                         *kernel_step = ARM_KERNEL_STEP_ACTIVE;
696                         kernel_enable_single_step(regs);
697                 }
698         }
699
700         return 0;
701 }
702 NOKPROBE_SYMBOL(breakpoint_handler);
703
704 /*
705  * Arm64 hardware does not always report a watchpoint hit address that matches
706  * one of the watchpoints set. It can also report an address "near" the
707  * watchpoint if a single instruction access both watched and unwatched
708  * addresses. There is no straight-forward way, short of disassembling the
709  * offending instruction, to map that address back to the watchpoint. This
710  * function computes the distance of the memory access from the watchpoint as a
711  * heuristic for the likelyhood that a given access triggered the watchpoint.
712  *
713  * See Section D2.10.5 "Determining the memory location that caused a Watchpoint
714  * exception" of ARMv8 Architecture Reference Manual for details.
715  *
716  * The function returns the distance of the address from the bytes watched by
717  * the watchpoint. In case of an exact match, it returns 0.
718  */
719 static u64 get_distance_from_watchpoint(unsigned long addr, u64 val,
720                                         struct arch_hw_breakpoint_ctrl *ctrl)
721 {
722         u64 wp_low, wp_high;
723         u32 lens, lene;
724
725         addr = untagged_addr(addr);
726
727         lens = __ffs(ctrl->len);
728         lene = __fls(ctrl->len);
729
730         wp_low = val + lens;
731         wp_high = val + lene;
732         if (addr < wp_low)
733                 return wp_low - addr;
734         else if (addr > wp_high)
735                 return addr - wp_high;
736         else
737                 return 0;
738 }
739
740 static int watchpoint_report(struct perf_event *wp, unsigned long addr,
741                              struct pt_regs *regs)
742 {
743         int step = uses_default_overflow_handler(wp);
744         struct arch_hw_breakpoint *info = counter_arch_bp(wp);
745
746         info->trigger = addr;
747
748         /*
749          * If we triggered a user watchpoint from a uaccess routine, then
750          * handle the stepping ourselves since userspace really can't help
751          * us with this.
752          */
753         if (!user_mode(regs) && info->ctrl.privilege == AARCH64_BREAKPOINT_EL0)
754                 step = 1;
755         else
756                 perf_bp_event(wp, regs);
757
758         return step;
759 }
760
761 static int watchpoint_handler(unsigned long addr, unsigned int esr,
762                               struct pt_regs *regs)
763 {
764         int i, step = 0, *kernel_step, access, closest_match = 0;
765         u64 min_dist = -1, dist;
766         u32 ctrl_reg;
767         u64 val;
768         struct perf_event *wp, **slots;
769         struct debug_info *debug_info;
770         struct arch_hw_breakpoint_ctrl ctrl;
771
772         slots = this_cpu_ptr(wp_on_reg);
773         debug_info = &current->thread.debug;
774
775         /*
776          * Find all watchpoints that match the reported address. If no exact
777          * match is found. Attribute the hit to the closest watchpoint.
778          */
779         rcu_read_lock();
780         for (i = 0; i < core_num_wrps; ++i) {
781                 wp = slots[i];
782                 if (wp == NULL)
783                         continue;
784
785                 /*
786                  * Check that the access type matches.
787                  * 0 => load, otherwise => store
788                  */
789                 access = (esr & AARCH64_ESR_ACCESS_MASK) ? HW_BREAKPOINT_W :
790                          HW_BREAKPOINT_R;
791                 if (!(access & hw_breakpoint_type(wp)))
792                         continue;
793
794                 /* Check if the watchpoint value and byte select match. */
795                 val = read_wb_reg(AARCH64_DBG_REG_WVR, i);
796                 ctrl_reg = read_wb_reg(AARCH64_DBG_REG_WCR, i);
797                 decode_ctrl_reg(ctrl_reg, &ctrl);
798                 dist = get_distance_from_watchpoint(addr, val, &ctrl);
799                 if (dist < min_dist) {
800                         min_dist = dist;
801                         closest_match = i;
802                 }
803                 /* Is this an exact match? */
804                 if (dist != 0)
805                         continue;
806
807                 step = watchpoint_report(wp, addr, regs);
808         }
809
810         /* No exact match found? */
811         if (min_dist > 0 && min_dist != -1)
812                 step = watchpoint_report(slots[closest_match], addr, regs);
813
814         rcu_read_unlock();
815
816         if (!step)
817                 return 0;
818
819         /*
820          * We always disable EL0 watchpoints because the kernel can
821          * cause these to fire via an unprivileged access.
822          */
823         toggle_bp_registers(AARCH64_DBG_REG_WCR, DBG_ACTIVE_EL0, 0);
824
825         if (user_mode(regs)) {
826                 debug_info->wps_disabled = 1;
827
828                 /* If we're already stepping a breakpoint, just return. */
829                 if (debug_info->bps_disabled)
830                         return 0;
831
832                 if (test_thread_flag(TIF_SINGLESTEP))
833                         debug_info->suspended_step = 1;
834                 else
835                         user_enable_single_step(current);
836         } else {
837                 toggle_bp_registers(AARCH64_DBG_REG_WCR, DBG_ACTIVE_EL1, 0);
838                 kernel_step = this_cpu_ptr(&stepping_kernel_bp);
839
840                 if (*kernel_step != ARM_KERNEL_STEP_NONE)
841                         return 0;
842
843                 if (kernel_active_single_step()) {
844                         *kernel_step = ARM_KERNEL_STEP_SUSPEND;
845                 } else {
846                         *kernel_step = ARM_KERNEL_STEP_ACTIVE;
847                         kernel_enable_single_step(regs);
848                 }
849         }
850
851         return 0;
852 }
853 NOKPROBE_SYMBOL(watchpoint_handler);
854
855 /*
856  * Handle single-step exception.
857  */
858 int reinstall_suspended_bps(struct pt_regs *regs)
859 {
860         struct debug_info *debug_info = &current->thread.debug;
861         int handled_exception = 0, *kernel_step;
862
863         kernel_step = this_cpu_ptr(&stepping_kernel_bp);
864
865         /*
866          * Called from single-step exception handler.
867          * Return 0 if execution can resume, 1 if a SIGTRAP should be
868          * reported.
869          */
870         if (user_mode(regs)) {
871                 if (debug_info->bps_disabled) {
872                         debug_info->bps_disabled = 0;
873                         toggle_bp_registers(AARCH64_DBG_REG_BCR, DBG_ACTIVE_EL0, 1);
874                         handled_exception = 1;
875                 }
876
877                 if (debug_info->wps_disabled) {
878                         debug_info->wps_disabled = 0;
879                         toggle_bp_registers(AARCH64_DBG_REG_WCR, DBG_ACTIVE_EL0, 1);
880                         handled_exception = 1;
881                 }
882
883                 if (handled_exception) {
884                         if (debug_info->suspended_step) {
885                                 debug_info->suspended_step = 0;
886                                 /* Allow exception handling to fall-through. */
887                                 handled_exception = 0;
888                         } else {
889                                 user_disable_single_step(current);
890                         }
891                 }
892         } else if (*kernel_step != ARM_KERNEL_STEP_NONE) {
893                 toggle_bp_registers(AARCH64_DBG_REG_BCR, DBG_ACTIVE_EL1, 1);
894                 toggle_bp_registers(AARCH64_DBG_REG_WCR, DBG_ACTIVE_EL1, 1);
895
896                 if (!debug_info->wps_disabled)
897                         toggle_bp_registers(AARCH64_DBG_REG_WCR, DBG_ACTIVE_EL0, 1);
898
899                 if (*kernel_step != ARM_KERNEL_STEP_SUSPEND) {
900                         kernel_disable_single_step();
901                         handled_exception = 1;
902                 } else {
903                         handled_exception = 0;
904                 }
905
906                 *kernel_step = ARM_KERNEL_STEP_NONE;
907         }
908
909         return !handled_exception;
910 }
911 NOKPROBE_SYMBOL(reinstall_suspended_bps);
912
913 /*
914  * Context-switcher for restoring suspended breakpoints.
915  */
916 void hw_breakpoint_thread_switch(struct task_struct *next)
917 {
918         /*
919          *           current        next
920          * disabled: 0              0     => The usual case, NOTIFY_DONE
921          *           0              1     => Disable the registers
922          *           1              0     => Enable the registers
923          *           1              1     => NOTIFY_DONE. per-task bps will
924          *                                   get taken care of by perf.
925          */
926
927         struct debug_info *current_debug_info, *next_debug_info;
928
929         current_debug_info = &current->thread.debug;
930         next_debug_info = &next->thread.debug;
931
932         /* Update breakpoints. */
933         if (current_debug_info->bps_disabled != next_debug_info->bps_disabled)
934                 toggle_bp_registers(AARCH64_DBG_REG_BCR,
935                                     DBG_ACTIVE_EL0,
936                                     !next_debug_info->bps_disabled);
937
938         /* Update watchpoints. */
939         if (current_debug_info->wps_disabled != next_debug_info->wps_disabled)
940                 toggle_bp_registers(AARCH64_DBG_REG_WCR,
941                                     DBG_ACTIVE_EL0,
942                                     !next_debug_info->wps_disabled);
943 }
944
945 /*
946  * CPU initialisation.
947  */
948 static int hw_breakpoint_reset(unsigned int cpu)
949 {
950         int i;
951         struct perf_event **slots;
952         /*
953          * When a CPU goes through cold-boot, it does not have any installed
954          * slot, so it is safe to share the same function for restoring and
955          * resetting breakpoints; when a CPU is hotplugged in, it goes
956          * through the slots, which are all empty, hence it just resets control
957          * and value for debug registers.
958          * When this function is triggered on warm-boot through a CPU PM
959          * notifier some slots might be initialized; if so they are
960          * reprogrammed according to the debug slots content.
961          */
962         for (slots = this_cpu_ptr(bp_on_reg), i = 0; i < core_num_brps; ++i) {
963                 if (slots[i]) {
964                         hw_breakpoint_control(slots[i], HW_BREAKPOINT_RESTORE);
965                 } else {
966                         write_wb_reg(AARCH64_DBG_REG_BCR, i, 0UL);
967                         write_wb_reg(AARCH64_DBG_REG_BVR, i, 0UL);
968                 }
969         }
970
971         for (slots = this_cpu_ptr(wp_on_reg), i = 0; i < core_num_wrps; ++i) {
972                 if (slots[i]) {
973                         hw_breakpoint_control(slots[i], HW_BREAKPOINT_RESTORE);
974                 } else {
975                         write_wb_reg(AARCH64_DBG_REG_WCR, i, 0UL);
976                         write_wb_reg(AARCH64_DBG_REG_WVR, i, 0UL);
977                 }
978         }
979
980         return 0;
981 }
982
983 #ifdef CONFIG_CPU_PM
984 extern void cpu_suspend_set_dbg_restorer(int (*hw_bp_restore)(unsigned int));
985 #else
986 static inline void cpu_suspend_set_dbg_restorer(int (*hw_bp_restore)(unsigned int))
987 {
988 }
989 #endif
990
991 /*
992  * One-time initialisation.
993  */
994 static int __init arch_hw_breakpoint_init(void)
995 {
996         int ret;
997
998         core_num_brps = get_num_brps();
999         core_num_wrps = get_num_wrps();
1000
1001         pr_info("found %d breakpoint and %d watchpoint registers.\n",
1002                 core_num_brps, core_num_wrps);
1003
1004         /* Register debug fault handlers. */
1005         hook_debug_fault_code(DBG_ESR_EVT_HWBP, breakpoint_handler, SIGTRAP,
1006                               TRAP_HWBKPT, "hw-breakpoint handler");
1007         hook_debug_fault_code(DBG_ESR_EVT_HWWP, watchpoint_handler, SIGTRAP,
1008                               TRAP_HWBKPT, "hw-watchpoint handler");
1009
1010         /*
1011          * Reset the breakpoint resources. We assume that a halting
1012          * debugger will leave the world in a nice state for us.
1013          */
1014         ret = cpuhp_setup_state(CPUHP_AP_PERF_ARM_HW_BREAKPOINT_STARTING,
1015                           "perf/arm64/hw_breakpoint:starting",
1016                           hw_breakpoint_reset, NULL);
1017         if (ret)
1018                 pr_err("failed to register CPU hotplug notifier: %d\n", ret);
1019
1020         /* Register cpu_suspend hw breakpoint restore hook */
1021         cpu_suspend_set_dbg_restorer(hw_breakpoint_reset);
1022
1023         return ret;
1024 }
1025 arch_initcall(arch_hw_breakpoint_init);
1026
1027 void hw_breakpoint_pmu_read(struct perf_event *bp)
1028 {
1029 }
1030
1031 /*
1032  * Dummy function to register with die_notifier.
1033  */
1034 int hw_breakpoint_exceptions_notify(struct notifier_block *unused,
1035                                     unsigned long val, void *data)
1036 {
1037         return NOTIFY_DONE;
1038 }