]>
Commit | Line | Data |
---|---|---|
f3f096cf SD |
1 | /* |
2 | * uprobes-based tracing events | |
3 | * | |
4 | * This program is free software; you can redistribute it and/or modify | |
5 | * it under the terms of the GNU General Public License version 2 as | |
6 | * published by the Free Software Foundation. | |
7 | * | |
8 | * This program is distributed in the hope that it will be useful, | |
9 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
10 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
11 | * GNU General Public License for more details. | |
12 | * | |
13 | * You should have received a copy of the GNU General Public License | |
14 | * along with this program; if not, write to the Free Software | |
15 | * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA | |
16 | * | |
17 | * Copyright (C) IBM Corporation, 2010-2012 | |
18 | * Author: Srikar Dronamraju <[email protected]> | |
19 | */ | |
20 | ||
21 | #include <linux/module.h> | |
22 | #include <linux/uaccess.h> | |
23 | #include <linux/uprobes.h> | |
24 | #include <linux/namei.h> | |
b2e902f0 | 25 | #include <linux/string.h> |
f3f096cf SD |
26 | |
27 | #include "trace_probe.h" | |
28 | ||
29 | #define UPROBE_EVENT_SYSTEM "uprobes" | |
30 | ||
457d1772 ON |
31 | struct uprobe_trace_entry_head { |
32 | struct trace_entry ent; | |
33 | unsigned long vaddr[]; | |
34 | }; | |
35 | ||
/*
 * Size of the fixed part of a uprobe record: the entry head plus two
 * addresses for a return probe, or one address otherwise.
 *
 * The argument is parenthesized so that any expression (including a
 * conditional expression) can be passed without changing how the
 * "? 2 : 1" selection is parsed.
 */
#define SIZEOF_TRACE_ENTRY(is_return)			\
	(sizeof(struct uprobe_trace_entry_head) +	\
	 sizeof(unsigned long) * ((is_return) ? 2 : 1))

/* Address of the fetched-argument data that follows the fixed part. */
#define DATAOF_TRACE_ENTRY(entry, is_return)		\
	((void *)(entry) + SIZEOF_TRACE_ENTRY(is_return))
42 | ||
736288ba ON |
43 | struct trace_uprobe_filter { |
44 | rwlock_t rwlock; | |
45 | int nr_systemwide; | |
46 | struct list_head perf_events; | |
47 | }; | |
48 | ||
f3f096cf SD |
49 | /* |
50 | * uprobe event core functions | |
51 | */ | |
f3f096cf SD |
52 | struct trace_uprobe { |
53 | struct list_head list; | |
736288ba | 54 | struct trace_uprobe_filter filter; |
a932b738 | 55 | struct uprobe_consumer consumer; |
f3f096cf SD |
56 | struct inode *inode; |
57 | char *filename; | |
58 | unsigned long offset; | |
59 | unsigned long nhit; | |
14577c39 | 60 | struct trace_probe tp; |
f3f096cf SD |
61 | }; |
62 | ||
14577c39 NK |
/* Bytes needed for a struct trace_uprobe carrying @n probe arguments. */
#define SIZEOF_TRACE_UPROBE(n)				\
	((sizeof(struct probe_arg) * (n)) +		\
	 offsetof(struct trace_uprobe, tp.args))
66 | ||
/* Defined later in this file; needed by the (un)register helpers below. */
static int register_uprobe_event(struct trace_uprobe *tu);
static int unregister_uprobe_event(struct trace_uprobe *tu);

/* uprobe_lock is held around every walk or update of uprobe_list. */
static DEFINE_MUTEX(uprobe_lock);
static LIST_HEAD(uprobe_list);
72 | ||
b7e0bf34 NK |
/*
 * Context read back through current->utask->vaddr by translate_user_vaddr():
 * the probe being handled and the address used to turn file offsets into
 * user virtual addresses.
 */
struct uprobe_dispatch_data {
	struct trace_uprobe	*tu;
	unsigned long		bp_addr;
};
77 | ||
/* Consumer callbacks installed by alloc_trace_uprobe(). */
static int uprobe_dispatcher(struct uprobe_consumer *con, struct pt_regs *regs);
static int uretprobe_dispatcher(struct uprobe_consumer *con,
				unsigned long func, struct pt_regs *regs);
f3f096cf | 81 | |
3fd996a2 NK |
/*
 * Return the address of the @n-th long-sized slot counted from @addr.
 * With CONFIG_STACK_GROWSUP the slots lie below @addr, otherwise above it.
 */
static unsigned long adjust_stack_addr(unsigned long addr, unsigned int n)
{
	unsigned long delta = n * sizeof(long);

#ifdef CONFIG_STACK_GROWSUP
	return addr - delta;
#else
	return addr + delta;
#endif
}
93 | ||
94 | static unsigned long get_user_stack_nth(struct pt_regs *regs, unsigned int n) | |
95 | { | |
96 | unsigned long ret; | |
97 | unsigned long addr = user_stack_pointer(regs); | |
98 | ||
99 | addr = adjust_stack_addr(addr, n); | |
100 | ||
101 | if (copy_from_user(&ret, (void __force __user *) addr, sizeof(ret))) | |
102 | return 0; | |
103 | ||
104 | return ret; | |
105 | } | |
106 | ||
107 | /* | |
108 | * Uprobes-specific fetch functions | |
109 | */ | |
110 | #define DEFINE_FETCH_stack(type) \ | |
fbc1963d MH |
111 | static void FETCH_FUNC_NAME(stack, type)(struct pt_regs *regs, \ |
112 | void *offset, void *dest) \ | |
3fd996a2 NK |
113 | { \ |
114 | *(type *)dest = (type)get_user_stack_nth(regs, \ | |
115 | ((unsigned long)offset)); \ | |
116 | } | |
117 | DEFINE_BASIC_FETCH_FUNCS(stack) | |
118 | /* No string on the stack entry */ | |
119 | #define fetch_stack_string NULL | |
120 | #define fetch_stack_string_size NULL | |
121 | ||
5baaa59e | 122 | #define DEFINE_FETCH_memory(type) \ |
fbc1963d MH |
123 | static void FETCH_FUNC_NAME(memory, type)(struct pt_regs *regs, \ |
124 | void *addr, void *dest) \ | |
5baaa59e NK |
125 | { \ |
126 | type retval; \ | |
127 | void __user *vaddr = (void __force __user *) addr; \ | |
128 | \ | |
129 | if (copy_from_user(&retval, vaddr, sizeof(type))) \ | |
130 | *(type *)dest = 0; \ | |
131 | else \ | |
132 | *(type *) dest = retval; \ | |
133 | } | |
134 | DEFINE_BASIC_FETCH_FUNCS(memory) | |
135 | /* | |
136 | * Fetch a null-terminated string. Caller MUST set *(u32 *)dest with max | |
137 | * length and relative data location. | |
138 | */ | |
fbc1963d MH |
139 | static void FETCH_FUNC_NAME(memory, string)(struct pt_regs *regs, |
140 | void *addr, void *dest) | |
5baaa59e NK |
141 | { |
142 | long ret; | |
143 | u32 rloc = *(u32 *)dest; | |
144 | int maxlen = get_rloc_len(rloc); | |
145 | u8 *dst = get_rloc_data(dest); | |
146 | void __user *src = (void __force __user *) addr; | |
147 | ||
148 | if (!maxlen) | |
149 | return; | |
150 | ||
151 | ret = strncpy_from_user(dst, src, maxlen); | |
152 | ||
153 | if (ret < 0) { /* Failed to fetch string */ | |
154 | ((u8 *)get_rloc_data(dest))[0] = '\0'; | |
155 | *(u32 *)dest = make_data_rloc(0, get_rloc_offs(rloc)); | |
156 | } else { | |
157 | *(u32 *)dest = make_data_rloc(ret, get_rloc_offs(rloc)); | |
158 | } | |
159 | } | |
160 | ||
fbc1963d MH |
161 | static void FETCH_FUNC_NAME(memory, string_size)(struct pt_regs *regs, |
162 | void *addr, void *dest) | |
5baaa59e NK |
163 | { |
164 | int len; | |
165 | void __user *vaddr = (void __force __user *) addr; | |
166 | ||
167 | len = strnlen_user(vaddr, MAX_STRING_SIZE); | |
168 | ||
169 | if (len == 0 || len > MAX_STRING_SIZE) /* Failed to check length */ | |
170 | *(u32 *)dest = 0; | |
171 | else | |
172 | *(u32 *)dest = len; | |
173 | } | |
3fd996a2 | 174 | |
b7e0bf34 NK |
175 | static unsigned long translate_user_vaddr(void *file_offset) |
176 | { | |
177 | unsigned long base_addr; | |
178 | struct uprobe_dispatch_data *udd; | |
179 | ||
180 | udd = (void *) current->utask->vaddr; | |
181 | ||
182 | base_addr = udd->bp_addr - udd->tu->offset; | |
183 | return base_addr + (unsigned long)file_offset; | |
184 | } | |
185 | ||
186 | #define DEFINE_FETCH_file_offset(type) \ | |
fbc1963d MH |
187 | static void FETCH_FUNC_NAME(file_offset, type)(struct pt_regs *regs, \ |
188 | void *offset, void *dest)\ | |
b7e0bf34 NK |
189 | { \ |
190 | void *vaddr = (void *)translate_user_vaddr(offset); \ | |
191 | \ | |
192 | FETCH_FUNC_NAME(memory, type)(regs, vaddr, dest); \ | |
193 | } | |
194 | DEFINE_BASIC_FETCH_FUNCS(file_offset) | |
195 | DEFINE_FETCH_file_offset(string) | |
196 | DEFINE_FETCH_file_offset(string_size) | |
197 | ||
34fee3a1 | 198 | /* Fetch type information table */ |
d9a16d3a | 199 | static const struct fetch_type uprobes_fetch_type_table[] = { |
34fee3a1 NK |
200 | /* Special types */ |
201 | [FETCH_TYPE_STRING] = __ASSIGN_FETCH_TYPE("string", string, string, | |
202 | sizeof(u32), 1, "__data_loc char[]"), | |
203 | [FETCH_TYPE_STRSIZE] = __ASSIGN_FETCH_TYPE("string_size", u32, | |
204 | string_size, sizeof(u32), 0, "u32"), | |
205 | /* Basic types */ | |
206 | ASSIGN_FETCH_TYPE(u8, u8, 0), | |
207 | ASSIGN_FETCH_TYPE(u16, u16, 0), | |
208 | ASSIGN_FETCH_TYPE(u32, u32, 0), | |
209 | ASSIGN_FETCH_TYPE(u64, u64, 0), | |
210 | ASSIGN_FETCH_TYPE(s8, u8, 1), | |
211 | ASSIGN_FETCH_TYPE(s16, u16, 1), | |
212 | ASSIGN_FETCH_TYPE(s32, u32, 1), | |
213 | ASSIGN_FETCH_TYPE(s64, u64, 1), | |
214 | ||
215 | ASSIGN_FETCH_TYPE_END | |
216 | }; | |
217 | ||
736288ba ON |
218 | static inline void init_trace_uprobe_filter(struct trace_uprobe_filter *filter) |
219 | { | |
220 | rwlock_init(&filter->rwlock); | |
221 | filter->nr_systemwide = 0; | |
222 | INIT_LIST_HEAD(&filter->perf_events); | |
223 | } | |
224 | ||
225 | static inline bool uprobe_filter_is_empty(struct trace_uprobe_filter *filter) | |
226 | { | |
227 | return !filter->nr_systemwide && list_empty(&filter->perf_events); | |
228 | } | |
229 | ||
c1ae5c75 ON |
230 | static inline bool is_ret_probe(struct trace_uprobe *tu) |
231 | { | |
232 | return tu->consumer.ret_handler != NULL; | |
233 | } | |
234 | ||
f3f096cf SD |
235 | /* |
236 | * Allocate new trace_uprobe and initialize it (including uprobes). | |
237 | */ | |
238 | static struct trace_uprobe * | |
c1ae5c75 | 239 | alloc_trace_uprobe(const char *group, const char *event, int nargs, bool is_ret) |
f3f096cf SD |
240 | { |
241 | struct trace_uprobe *tu; | |
242 | ||
243 | if (!event || !is_good_name(event)) | |
244 | return ERR_PTR(-EINVAL); | |
245 | ||
246 | if (!group || !is_good_name(group)) | |
247 | return ERR_PTR(-EINVAL); | |
248 | ||
249 | tu = kzalloc(SIZEOF_TRACE_UPROBE(nargs), GFP_KERNEL); | |
250 | if (!tu) | |
251 | return ERR_PTR(-ENOMEM); | |
252 | ||
14577c39 NK |
253 | tu->tp.call.class = &tu->tp.class; |
254 | tu->tp.call.name = kstrdup(event, GFP_KERNEL); | |
255 | if (!tu->tp.call.name) | |
f3f096cf SD |
256 | goto error; |
257 | ||
14577c39 NK |
258 | tu->tp.class.system = kstrdup(group, GFP_KERNEL); |
259 | if (!tu->tp.class.system) | |
f3f096cf SD |
260 | goto error; |
261 | ||
262 | INIT_LIST_HEAD(&tu->list); | |
70ed91c6 | 263 | INIT_LIST_HEAD(&tu->tp.files); |
a932b738 | 264 | tu->consumer.handler = uprobe_dispatcher; |
c1ae5c75 ON |
265 | if (is_ret) |
266 | tu->consumer.ret_handler = uretprobe_dispatcher; | |
736288ba | 267 | init_trace_uprobe_filter(&tu->filter); |
f3f096cf SD |
268 | return tu; |
269 | ||
270 | error: | |
14577c39 | 271 | kfree(tu->tp.call.name); |
f3f096cf SD |
272 | kfree(tu); |
273 | ||
274 | return ERR_PTR(-ENOMEM); | |
275 | } | |
276 | ||
277 | static void free_trace_uprobe(struct trace_uprobe *tu) | |
278 | { | |
279 | int i; | |
280 | ||
14577c39 NK |
281 | for (i = 0; i < tu->tp.nr_args; i++) |
282 | traceprobe_free_probe_arg(&tu->tp.args[i]); | |
f3f096cf SD |
283 | |
284 | iput(tu->inode); | |
14577c39 NK |
285 | kfree(tu->tp.call.class->system); |
286 | kfree(tu->tp.call.name); | |
f3f096cf SD |
287 | kfree(tu->filename); |
288 | kfree(tu); | |
289 | } | |
290 | ||
291 | static struct trace_uprobe *find_probe_event(const char *event, const char *group) | |
292 | { | |
293 | struct trace_uprobe *tu; | |
294 | ||
295 | list_for_each_entry(tu, &uprobe_list, list) | |
687fcc4a | 296 | if (strcmp(trace_event_name(&tu->tp.call), event) == 0 && |
14577c39 | 297 | strcmp(tu->tp.call.class->system, group) == 0) |
f3f096cf SD |
298 | return tu; |
299 | ||
300 | return NULL; | |
301 | } | |
302 | ||
303 | /* Unregister a trace_uprobe and probe_event: call with locking uprobe_lock */ | |
c6c2401d | 304 | static int unregister_trace_uprobe(struct trace_uprobe *tu) |
f3f096cf | 305 | { |
c6c2401d SRRH |
306 | int ret; |
307 | ||
308 | ret = unregister_uprobe_event(tu); | |
309 | if (ret) | |
310 | return ret; | |
311 | ||
f3f096cf | 312 | list_del(&tu->list); |
f3f096cf | 313 | free_trace_uprobe(tu); |
c6c2401d | 314 | return 0; |
f3f096cf SD |
315 | } |
316 | ||
317 | /* Register a trace_uprobe and probe_event */ | |
318 | static int register_trace_uprobe(struct trace_uprobe *tu) | |
319 | { | |
14577c39 | 320 | struct trace_uprobe *old_tu; |
f3f096cf SD |
321 | int ret; |
322 | ||
323 | mutex_lock(&uprobe_lock); | |
324 | ||
325 | /* register as an event */ | |
687fcc4a | 326 | old_tu = find_probe_event(trace_event_name(&tu->tp.call), |
de7b2973 | 327 | tu->tp.call.class->system); |
14577c39 | 328 | if (old_tu) { |
f3f096cf | 329 | /* delete old event */ |
14577c39 | 330 | ret = unregister_trace_uprobe(old_tu); |
c6c2401d SRRH |
331 | if (ret) |
332 | goto end; | |
333 | } | |
f3f096cf SD |
334 | |
335 | ret = register_uprobe_event(tu); | |
336 | if (ret) { | |
337 | pr_warning("Failed to register probe event(%d)\n", ret); | |
338 | goto end; | |
339 | } | |
340 | ||
341 | list_add_tail(&tu->list, &uprobe_list); | |
342 | ||
343 | end: | |
344 | mutex_unlock(&uprobe_lock); | |
345 | ||
346 | return ret; | |
347 | } | |
348 | ||
349 | /* | |
350 | * Argument syntax: | |
306cfe20 | 351 | * - Add uprobe: p|r[:[GRP/]EVENT] PATH:OFFSET [FETCHARGS] |
f3f096cf SD |
352 | * |
353 | * - Remove uprobe: -:[GRP/]EVENT | |
354 | */ | |
355 | static int create_trace_uprobe(int argc, char **argv) | |
356 | { | |
357 | struct trace_uprobe *tu; | |
358 | struct inode *inode; | |
359 | char *arg, *event, *group, *filename; | |
360 | char buf[MAX_EVENT_NAME_LEN]; | |
361 | struct path path; | |
362 | unsigned long offset; | |
4ee5a52e | 363 | bool is_delete, is_return; |
f3f096cf SD |
364 | int i, ret; |
365 | ||
366 | inode = NULL; | |
367 | ret = 0; | |
368 | is_delete = false; | |
4ee5a52e | 369 | is_return = false; |
f3f096cf SD |
370 | event = NULL; |
371 | group = NULL; | |
372 | ||
373 | /* argc must be >= 1 */ | |
374 | if (argv[0][0] == '-') | |
375 | is_delete = true; | |
4ee5a52e ON |
376 | else if (argv[0][0] == 'r') |
377 | is_return = true; | |
f3f096cf | 378 | else if (argv[0][0] != 'p') { |
4ee5a52e | 379 | pr_info("Probe definition must be started with 'p', 'r' or '-'.\n"); |
f3f096cf SD |
380 | return -EINVAL; |
381 | } | |
382 | ||
383 | if (argv[0][1] == ':') { | |
384 | event = &argv[0][2]; | |
385 | arg = strchr(event, '/'); | |
386 | ||
387 | if (arg) { | |
388 | group = event; | |
389 | event = arg + 1; | |
390 | event[-1] = '\0'; | |
391 | ||
392 | if (strlen(group) == 0) { | |
393 | pr_info("Group name is not specified\n"); | |
394 | return -EINVAL; | |
395 | } | |
396 | } | |
397 | if (strlen(event) == 0) { | |
398 | pr_info("Event name is not specified\n"); | |
399 | return -EINVAL; | |
400 | } | |
401 | } | |
402 | if (!group) | |
403 | group = UPROBE_EVENT_SYSTEM; | |
404 | ||
405 | if (is_delete) { | |
c6c2401d SRRH |
406 | int ret; |
407 | ||
f3f096cf SD |
408 | if (!event) { |
409 | pr_info("Delete command needs an event name.\n"); | |
410 | return -EINVAL; | |
411 | } | |
412 | mutex_lock(&uprobe_lock); | |
413 | tu = find_probe_event(event, group); | |
414 | ||
415 | if (!tu) { | |
416 | mutex_unlock(&uprobe_lock); | |
417 | pr_info("Event %s/%s doesn't exist.\n", group, event); | |
418 | return -ENOENT; | |
419 | } | |
420 | /* delete an event */ | |
c6c2401d | 421 | ret = unregister_trace_uprobe(tu); |
f3f096cf | 422 | mutex_unlock(&uprobe_lock); |
c6c2401d | 423 | return ret; |
f3f096cf SD |
424 | } |
425 | ||
426 | if (argc < 2) { | |
427 | pr_info("Probe point is not specified.\n"); | |
428 | return -EINVAL; | |
429 | } | |
430 | if (isdigit(argv[1][0])) { | |
431 | pr_info("probe point must be have a filename.\n"); | |
432 | return -EINVAL; | |
433 | } | |
434 | arg = strchr(argv[1], ':'); | |
fa44063f J |
435 | if (!arg) { |
436 | ret = -EINVAL; | |
f3f096cf | 437 | goto fail_address_parse; |
fa44063f | 438 | } |
f3f096cf SD |
439 | |
440 | *arg++ = '\0'; | |
441 | filename = argv[1]; | |
442 | ret = kern_path(filename, LOOKUP_FOLLOW, &path); | |
443 | if (ret) | |
444 | goto fail_address_parse; | |
445 | ||
7682c918 | 446 | inode = igrab(d_inode(path.dentry)); |
84d7ed79 ON |
447 | path_put(&path); |
448 | ||
7e4e28c5 | 449 | if (!inode || !S_ISREG(inode->i_mode)) { |
d24d7dbf JZ |
450 | ret = -EINVAL; |
451 | goto fail_address_parse; | |
452 | } | |
f3f096cf | 453 | |
84d7ed79 ON |
454 | ret = kstrtoul(arg, 0, &offset); |
455 | if (ret) | |
456 | goto fail_address_parse; | |
457 | ||
f3f096cf SD |
458 | argc -= 2; |
459 | argv += 2; | |
460 | ||
461 | /* setup a probe */ | |
462 | if (!event) { | |
b2e902f0 | 463 | char *tail; |
f3f096cf SD |
464 | char *ptr; |
465 | ||
b2e902f0 AS |
466 | tail = kstrdup(kbasename(filename), GFP_KERNEL); |
467 | if (!tail) { | |
f3f096cf SD |
468 | ret = -ENOMEM; |
469 | goto fail_address_parse; | |
470 | } | |
471 | ||
f3f096cf SD |
472 | ptr = strpbrk(tail, ".-_"); |
473 | if (ptr) | |
474 | *ptr = '\0'; | |
475 | ||
476 | snprintf(buf, MAX_EVENT_NAME_LEN, "%c_%s_0x%lx", 'p', tail, offset); | |
477 | event = buf; | |
478 | kfree(tail); | |
479 | } | |
480 | ||
4ee5a52e | 481 | tu = alloc_trace_uprobe(group, event, argc, is_return); |
f3f096cf SD |
482 | if (IS_ERR(tu)) { |
483 | pr_info("Failed to allocate trace_uprobe.(%d)\n", (int)PTR_ERR(tu)); | |
484 | ret = PTR_ERR(tu); | |
485 | goto fail_address_parse; | |
486 | } | |
487 | tu->offset = offset; | |
488 | tu->inode = inode; | |
489 | tu->filename = kstrdup(filename, GFP_KERNEL); | |
490 | ||
491 | if (!tu->filename) { | |
492 | pr_info("Failed to allocate filename.\n"); | |
493 | ret = -ENOMEM; | |
494 | goto error; | |
495 | } | |
496 | ||
497 | /* parse arguments */ | |
498 | ret = 0; | |
499 | for (i = 0; i < argc && i < MAX_TRACE_ARGS; i++) { | |
14577c39 NK |
500 | struct probe_arg *parg = &tu->tp.args[i]; |
501 | ||
f3f096cf | 502 | /* Increment count for freeing args in error case */ |
14577c39 | 503 | tu->tp.nr_args++; |
f3f096cf SD |
504 | |
505 | /* Parse argument name */ | |
506 | arg = strchr(argv[i], '='); | |
507 | if (arg) { | |
508 | *arg++ = '\0'; | |
14577c39 | 509 | parg->name = kstrdup(argv[i], GFP_KERNEL); |
f3f096cf SD |
510 | } else { |
511 | arg = argv[i]; | |
512 | /* If argument name is omitted, set "argN" */ | |
513 | snprintf(buf, MAX_EVENT_NAME_LEN, "arg%d", i + 1); | |
14577c39 | 514 | parg->name = kstrdup(buf, GFP_KERNEL); |
f3f096cf SD |
515 | } |
516 | ||
14577c39 | 517 | if (!parg->name) { |
f3f096cf SD |
518 | pr_info("Failed to allocate argument[%d] name.\n", i); |
519 | ret = -ENOMEM; | |
520 | goto error; | |
521 | } | |
522 | ||
14577c39 NK |
523 | if (!is_good_name(parg->name)) { |
524 | pr_info("Invalid argument[%d] name: %s\n", i, parg->name); | |
f3f096cf SD |
525 | ret = -EINVAL; |
526 | goto error; | |
527 | } | |
528 | ||
14577c39 | 529 | if (traceprobe_conflict_field_name(parg->name, tu->tp.args, i)) { |
f3f096cf SD |
530 | pr_info("Argument[%d] name '%s' conflicts with " |
531 | "another field.\n", i, argv[i]); | |
532 | ret = -EINVAL; | |
533 | goto error; | |
534 | } | |
535 | ||
536 | /* Parse fetch argument */ | |
14577c39 | 537 | ret = traceprobe_parse_probe_arg(arg, &tu->tp.size, parg, |
d9a16d3a SR |
538 | is_return, false, |
539 | uprobes_fetch_type_table); | |
f3f096cf SD |
540 | if (ret) { |
541 | pr_info("Parse error at argument[%d]. (%d)\n", i, ret); | |
542 | goto error; | |
543 | } | |
544 | } | |
545 | ||
546 | ret = register_trace_uprobe(tu); | |
547 | if (ret) | |
548 | goto error; | |
549 | return 0; | |
550 | ||
551 | error: | |
552 | free_trace_uprobe(tu); | |
553 | return ret; | |
554 | ||
555 | fail_address_parse: | |
16a8ef27 | 556 | iput(inode); |
f3f096cf | 557 | |
d24d7dbf | 558 | pr_info("Failed to parse address or file.\n"); |
f3f096cf SD |
559 | |
560 | return ret; | |
561 | } | |
562 | ||
c6c2401d | 563 | static int cleanup_all_probes(void) |
f3f096cf SD |
564 | { |
565 | struct trace_uprobe *tu; | |
c6c2401d | 566 | int ret = 0; |
f3f096cf SD |
567 | |
568 | mutex_lock(&uprobe_lock); | |
569 | while (!list_empty(&uprobe_list)) { | |
570 | tu = list_entry(uprobe_list.next, struct trace_uprobe, list); | |
c6c2401d SRRH |
571 | ret = unregister_trace_uprobe(tu); |
572 | if (ret) | |
573 | break; | |
f3f096cf SD |
574 | } |
575 | mutex_unlock(&uprobe_lock); | |
c6c2401d | 576 | return ret; |
f3f096cf SD |
577 | } |
578 | ||
579 | /* Probes listing interfaces */ | |
580 | static void *probes_seq_start(struct seq_file *m, loff_t *pos) | |
581 | { | |
582 | mutex_lock(&uprobe_lock); | |
583 | return seq_list_start(&uprobe_list, *pos); | |
584 | } | |
585 | ||
586 | static void *probes_seq_next(struct seq_file *m, void *v, loff_t *pos) | |
587 | { | |
588 | return seq_list_next(v, &uprobe_list, pos); | |
589 | } | |
590 | ||
591 | static void probes_seq_stop(struct seq_file *m, void *v) | |
592 | { | |
593 | mutex_unlock(&uprobe_lock); | |
594 | } | |
595 | ||
596 | static int probes_seq_show(struct seq_file *m, void *v) | |
597 | { | |
598 | struct trace_uprobe *tu = v; | |
3ede82dd | 599 | char c = is_ret_probe(tu) ? 'r' : 'p'; |
f3f096cf SD |
600 | int i; |
601 | ||
de7b2973 | 602 | seq_printf(m, "%c:%s/%s", c, tu->tp.call.class->system, |
687fcc4a | 603 | trace_event_name(&tu->tp.call)); |
a2fb3382 WN |
604 | seq_printf(m, " %s:", tu->filename); |
605 | ||
606 | /* Don't print "0x (null)" when offset is 0 */ | |
607 | if (tu->offset) { | |
608 | seq_printf(m, "0x%p", (void *)tu->offset); | |
609 | } else { | |
610 | switch (sizeof(void *)) { | |
611 | case 4: | |
612 | seq_printf(m, "0x00000000"); | |
613 | break; | |
614 | case 8: | |
615 | default: | |
616 | seq_printf(m, "0x0000000000000000"); | |
617 | break; | |
618 | } | |
619 | } | |
f3f096cf | 620 | |
14577c39 NK |
621 | for (i = 0; i < tu->tp.nr_args; i++) |
622 | seq_printf(m, " %s=%s", tu->tp.args[i].name, tu->tp.args[i].comm); | |
f3f096cf | 623 | |
fa6f0cc7 | 624 | seq_putc(m, '\n'); |
f3f096cf SD |
625 | return 0; |
626 | } | |
627 | ||
628 | static const struct seq_operations probes_seq_op = { | |
629 | .start = probes_seq_start, | |
630 | .next = probes_seq_next, | |
631 | .stop = probes_seq_stop, | |
632 | .show = probes_seq_show | |
633 | }; | |
634 | ||
635 | static int probes_open(struct inode *inode, struct file *file) | |
636 | { | |
c6c2401d SRRH |
637 | int ret; |
638 | ||
639 | if ((file->f_mode & FMODE_WRITE) && (file->f_flags & O_TRUNC)) { | |
640 | ret = cleanup_all_probes(); | |
641 | if (ret) | |
642 | return ret; | |
643 | } | |
f3f096cf SD |
644 | |
645 | return seq_open(file, &probes_seq_op); | |
646 | } | |
647 | ||
648 | static ssize_t probes_write(struct file *file, const char __user *buffer, | |
649 | size_t count, loff_t *ppos) | |
650 | { | |
651 | return traceprobe_probes_write(file, buffer, count, ppos, create_trace_uprobe); | |
652 | } | |
653 | ||
654 | static const struct file_operations uprobe_events_ops = { | |
655 | .owner = THIS_MODULE, | |
656 | .open = probes_open, | |
657 | .read = seq_read, | |
658 | .llseek = seq_lseek, | |
659 | .release = seq_release, | |
660 | .write = probes_write, | |
661 | }; | |
662 | ||
663 | /* Probes profiling interfaces */ | |
664 | static int probes_profile_seq_show(struct seq_file *m, void *v) | |
665 | { | |
666 | struct trace_uprobe *tu = v; | |
667 | ||
de7b2973 | 668 | seq_printf(m, " %s %-44s %15lu\n", tu->filename, |
687fcc4a | 669 | trace_event_name(&tu->tp.call), tu->nhit); |
f3f096cf SD |
670 | return 0; |
671 | } | |
672 | ||
673 | static const struct seq_operations profile_seq_op = { | |
674 | .start = probes_seq_start, | |
675 | .next = probes_seq_next, | |
676 | .stop = probes_seq_stop, | |
677 | .show = probes_profile_seq_show | |
678 | }; | |
679 | ||
680 | static int profile_open(struct inode *inode, struct file *file) | |
681 | { | |
682 | return seq_open(file, &profile_seq_op); | |
683 | } | |
684 | ||
685 | static const struct file_operations uprobe_profile_ops = { | |
686 | .owner = THIS_MODULE, | |
687 | .open = profile_open, | |
688 | .read = seq_read, | |
689 | .llseek = seq_lseek, | |
690 | .release = seq_release, | |
691 | }; | |
692 | ||
dcad1a20 NK |
693 | struct uprobe_cpu_buffer { |
694 | struct mutex mutex; | |
695 | void *buf; | |
696 | }; | |
697 | static struct uprobe_cpu_buffer __percpu *uprobe_cpu_buffer; | |
698 | static int uprobe_buffer_refcnt; | |
699 | ||
700 | static int uprobe_buffer_init(void) | |
701 | { | |
702 | int cpu, err_cpu; | |
703 | ||
704 | uprobe_cpu_buffer = alloc_percpu(struct uprobe_cpu_buffer); | |
705 | if (uprobe_cpu_buffer == NULL) | |
706 | return -ENOMEM; | |
707 | ||
708 | for_each_possible_cpu(cpu) { | |
709 | struct page *p = alloc_pages_node(cpu_to_node(cpu), | |
710 | GFP_KERNEL, 0); | |
711 | if (p == NULL) { | |
712 | err_cpu = cpu; | |
713 | goto err; | |
714 | } | |
715 | per_cpu_ptr(uprobe_cpu_buffer, cpu)->buf = page_address(p); | |
716 | mutex_init(&per_cpu_ptr(uprobe_cpu_buffer, cpu)->mutex); | |
717 | } | |
718 | ||
719 | return 0; | |
720 | ||
721 | err: | |
722 | for_each_possible_cpu(cpu) { | |
723 | if (cpu == err_cpu) | |
724 | break; | |
725 | free_page((unsigned long)per_cpu_ptr(uprobe_cpu_buffer, cpu)->buf); | |
726 | } | |
727 | ||
728 | free_percpu(uprobe_cpu_buffer); | |
729 | return -ENOMEM; | |
730 | } | |
731 | ||
732 | static int uprobe_buffer_enable(void) | |
733 | { | |
734 | int ret = 0; | |
735 | ||
736 | BUG_ON(!mutex_is_locked(&event_mutex)); | |
737 | ||
738 | if (uprobe_buffer_refcnt++ == 0) { | |
739 | ret = uprobe_buffer_init(); | |
740 | if (ret < 0) | |
741 | uprobe_buffer_refcnt--; | |
742 | } | |
743 | ||
744 | return ret; | |
745 | } | |
746 | ||
747 | static void uprobe_buffer_disable(void) | |
748 | { | |
6ea6215f J |
749 | int cpu; |
750 | ||
dcad1a20 NK |
751 | BUG_ON(!mutex_is_locked(&event_mutex)); |
752 | ||
753 | if (--uprobe_buffer_refcnt == 0) { | |
6ea6215f J |
754 | for_each_possible_cpu(cpu) |
755 | free_page((unsigned long)per_cpu_ptr(uprobe_cpu_buffer, | |
756 | cpu)->buf); | |
757 | ||
dcad1a20 NK |
758 | free_percpu(uprobe_cpu_buffer); |
759 | uprobe_cpu_buffer = NULL; | |
760 | } | |
761 | } | |
762 | ||
763 | static struct uprobe_cpu_buffer *uprobe_buffer_get(void) | |
764 | { | |
765 | struct uprobe_cpu_buffer *ucb; | |
766 | int cpu; | |
767 | ||
768 | cpu = raw_smp_processor_id(); | |
769 | ucb = per_cpu_ptr(uprobe_cpu_buffer, cpu); | |
770 | ||
771 | /* | |
772 | * Use per-cpu buffers for fastest access, but we might migrate | |
773 | * so the mutex makes sure we have sole access to it. | |
774 | */ | |
775 | mutex_lock(&ucb->mutex); | |
776 | ||
777 | return ucb; | |
778 | } | |
779 | ||
780 | static void uprobe_buffer_put(struct uprobe_cpu_buffer *ucb) | |
781 | { | |
782 | mutex_unlock(&ucb->mutex); | |
783 | } | |
784 | ||
a43b9704 | 785 | static void __uprobe_trace_func(struct trace_uprobe *tu, |
dd9fa555 | 786 | unsigned long func, struct pt_regs *regs, |
70ed91c6 | 787 | struct uprobe_cpu_buffer *ucb, int dsize, |
7f1d2f82 | 788 | struct trace_event_file *trace_file) |
f3f096cf SD |
789 | { |
790 | struct uprobe_trace_entry_head *entry; | |
791 | struct ring_buffer_event *event; | |
792 | struct ring_buffer *buffer; | |
457d1772 | 793 | void *data; |
dd9fa555 | 794 | int size, esize; |
2425bcb9 | 795 | struct trace_event_call *call = &tu->tp.call; |
f3f096cf | 796 | |
7f1d2f82 | 797 | WARN_ON(call != trace_file->event_call); |
70ed91c6 | 798 | |
dd9fa555 | 799 | if (WARN_ON_ONCE(tu->tp.size + dsize > PAGE_SIZE)) |
dcad1a20 NK |
800 | return; |
801 | ||
09a5059a | 802 | if (trace_trigger_soft_disabled(trace_file)) |
ca3b1620 NK |
803 | return; |
804 | ||
dd9fa555 | 805 | esize = SIZEOF_TRACE_ENTRY(is_ret_probe(tu)); |
dcad1a20 | 806 | size = esize + tu->tp.size + dsize; |
7f1d2f82 | 807 | event = trace_event_buffer_lock_reserve(&buffer, trace_file, |
70ed91c6 | 808 | call->event.type, size, 0, 0); |
f3f096cf | 809 | if (!event) |
dd9fa555 | 810 | return; |
f3f096cf SD |
811 | |
812 | entry = ring_buffer_event_data(event); | |
393a736c ON |
813 | if (is_ret_probe(tu)) { |
814 | entry->vaddr[0] = func; | |
815 | entry->vaddr[1] = instruction_pointer(regs); | |
816 | data = DATAOF_TRACE_ENTRY(entry, true); | |
817 | } else { | |
818 | entry->vaddr[0] = instruction_pointer(regs); | |
819 | data = DATAOF_TRACE_ENTRY(entry, false); | |
820 | } | |
821 | ||
dcad1a20 | 822 | memcpy(data, ucb->buf, tu->tp.size + dsize); |
f3f096cf | 823 | |
7f1d2f82 | 824 | event_trigger_unlock_commit(trace_file, buffer, event, entry, 0, 0); |
a51cc604 | 825 | } |
f42d24a1 | 826 | |
a51cc604 | 827 | /* uprobe handler */ |
dd9fa555 NK |
828 | static int uprobe_trace_func(struct trace_uprobe *tu, struct pt_regs *regs, |
829 | struct uprobe_cpu_buffer *ucb, int dsize) | |
a51cc604 | 830 | { |
70ed91c6 J |
831 | struct event_file_link *link; |
832 | ||
833 | if (is_ret_probe(tu)) | |
834 | return 0; | |
835 | ||
836 | rcu_read_lock(); | |
837 | list_for_each_entry_rcu(link, &tu->tp.files, list) | |
838 | __uprobe_trace_func(tu, 0, regs, ucb, dsize, link->file); | |
839 | rcu_read_unlock(); | |
840 | ||
f42d24a1 | 841 | return 0; |
f3f096cf SD |
842 | } |
843 | ||
c1ae5c75 | 844 | static void uretprobe_trace_func(struct trace_uprobe *tu, unsigned long func, |
dd9fa555 NK |
845 | struct pt_regs *regs, |
846 | struct uprobe_cpu_buffer *ucb, int dsize) | |
c1ae5c75 | 847 | { |
70ed91c6 J |
848 | struct event_file_link *link; |
849 | ||
850 | rcu_read_lock(); | |
851 | list_for_each_entry_rcu(link, &tu->tp.files, list) | |
852 | __uprobe_trace_func(tu, func, regs, ucb, dsize, link->file); | |
853 | rcu_read_unlock(); | |
c1ae5c75 ON |
854 | } |
855 | ||
f3f096cf SD |
856 | /* Event entry printers */ |
857 | static enum print_line_t | |
858 | print_uprobe_event(struct trace_iterator *iter, int flags, struct trace_event *event) | |
859 | { | |
457d1772 | 860 | struct uprobe_trace_entry_head *entry; |
f3f096cf SD |
861 | struct trace_seq *s = &iter->seq; |
862 | struct trace_uprobe *tu; | |
863 | u8 *data; | |
864 | int i; | |
865 | ||
457d1772 | 866 | entry = (struct uprobe_trace_entry_head *)iter->ent; |
14577c39 | 867 | tu = container_of(event, struct trace_uprobe, tp.call.event); |
f3f096cf | 868 | |
3ede82dd | 869 | if (is_ret_probe(tu)) { |
8579a107 | 870 | trace_seq_printf(s, "%s: (0x%lx <- 0x%lx)", |
687fcc4a | 871 | trace_event_name(&tu->tp.call), |
8579a107 | 872 | entry->vaddr[1], entry->vaddr[0]); |
3ede82dd ON |
873 | data = DATAOF_TRACE_ENTRY(entry, true); |
874 | } else { | |
8579a107 | 875 | trace_seq_printf(s, "%s: (0x%lx)", |
687fcc4a | 876 | trace_event_name(&tu->tp.call), |
8579a107 | 877 | entry->vaddr[0]); |
3ede82dd ON |
878 | data = DATAOF_TRACE_ENTRY(entry, false); |
879 | } | |
f3f096cf | 880 | |
14577c39 NK |
881 | for (i = 0; i < tu->tp.nr_args; i++) { |
882 | struct probe_arg *parg = &tu->tp.args[i]; | |
883 | ||
884 | if (!parg->type->print(s, parg->name, data + parg->offset, entry)) | |
8579a107 | 885 | goto out; |
f3f096cf SD |
886 | } |
887 | ||
8579a107 | 888 | trace_seq_putc(s, '\n'); |
f3f096cf | 889 | |
8579a107 SRRH |
890 | out: |
891 | return trace_handle_return(s); | |
f3f096cf SD |
892 | } |
893 | ||
31ba3348 ON |
894 | typedef bool (*filter_func_t)(struct uprobe_consumer *self, |
895 | enum uprobe_filter_ctx ctx, | |
896 | struct mm_struct *mm); | |
897 | ||
898 | static int | |
7f1d2f82 | 899 | probe_event_enable(struct trace_uprobe *tu, struct trace_event_file *file, |
70ed91c6 | 900 | filter_func_t filter) |
f3f096cf | 901 | { |
70ed91c6 J |
902 | bool enabled = trace_probe_is_enabled(&tu->tp); |
903 | struct event_file_link *link = NULL; | |
904 | int ret; | |
905 | ||
906 | if (file) { | |
48212542 ON |
907 | if (tu->tp.flags & TP_FLAG_PROFILE) |
908 | return -EINTR; | |
909 | ||
70ed91c6 J |
910 | link = kmalloc(sizeof(*link), GFP_KERNEL); |
911 | if (!link) | |
912 | return -ENOMEM; | |
913 | ||
914 | link->file = file; | |
915 | list_add_tail_rcu(&link->list, &tu->tp.files); | |
916 | ||
917 | tu->tp.flags |= TP_FLAG_TRACE; | |
48212542 ON |
918 | } else { |
919 | if (tu->tp.flags & TP_FLAG_TRACE) | |
920 | return -EINTR; | |
921 | ||
70ed91c6 | 922 | tu->tp.flags |= TP_FLAG_PROFILE; |
48212542 | 923 | } |
f3f096cf | 924 | |
736288ba ON |
925 | WARN_ON(!uprobe_filter_is_empty(&tu->filter)); |
926 | ||
70ed91c6 J |
927 | if (enabled) |
928 | return 0; | |
929 | ||
fb6bab6a ON |
930 | ret = uprobe_buffer_enable(); |
931 | if (ret) | |
932 | goto err_flags; | |
933 | ||
31ba3348 | 934 | tu->consumer.filter = filter; |
a932b738 | 935 | ret = uprobe_register(tu->inode, tu->offset, &tu->consumer); |
fb6bab6a ON |
936 | if (ret) |
937 | goto err_buffer; | |
938 | ||
939 | return 0; | |
940 | ||
941 | err_buffer: | |
942 | uprobe_buffer_disable(); | |
f3f096cf | 943 | |
fb6bab6a ON |
944 | err_flags: |
945 | if (file) { | |
946 | list_del(&link->list); | |
947 | kfree(link); | |
948 | tu->tp.flags &= ~TP_FLAG_TRACE; | |
949 | } else { | |
950 | tu->tp.flags &= ~TP_FLAG_PROFILE; | |
951 | } | |
4161824f | 952 | return ret; |
f3f096cf SD |
953 | } |
954 | ||
70ed91c6 | 955 | static void |
7f1d2f82 | 956 | probe_event_disable(struct trace_uprobe *tu, struct trace_event_file *file) |
f3f096cf | 957 | { |
14577c39 | 958 | if (!trace_probe_is_enabled(&tu->tp)) |
f3f096cf SD |
959 | return; |
960 | ||
70ed91c6 J |
961 | if (file) { |
962 | struct event_file_link *link; | |
963 | ||
964 | link = find_event_file_link(&tu->tp, file); | |
965 | if (!link) | |
966 | return; | |
967 | ||
968 | list_del_rcu(&link->list); | |
969 | /* synchronize with u{,ret}probe_trace_func */ | |
970 | synchronize_sched(); | |
971 | kfree(link); | |
972 | ||
973 | if (!list_empty(&tu->tp.files)) | |
974 | return; | |
975 | } | |
976 | ||
736288ba ON |
977 | WARN_ON(!uprobe_filter_is_empty(&tu->filter)); |
978 | ||
a932b738 | 979 | uprobe_unregister(tu->inode, tu->offset, &tu->consumer); |
70ed91c6 | 980 | tu->tp.flags &= file ? ~TP_FLAG_TRACE : ~TP_FLAG_PROFILE; |
dcad1a20 NK |
981 | |
982 | uprobe_buffer_disable(); | |
f3f096cf SD |
983 | } |
984 | ||
2425bcb9 | 985 | static int uprobe_event_define_fields(struct trace_event_call *event_call) |
f3f096cf | 986 | { |
457d1772 | 987 | int ret, i, size; |
f3f096cf | 988 | struct uprobe_trace_entry_head field; |
457d1772 | 989 | struct trace_uprobe *tu = event_call->data; |
f3f096cf | 990 | |
4d1298e2 ON |
991 | if (is_ret_probe(tu)) { |
992 | DEFINE_FIELD(unsigned long, vaddr[0], FIELD_STRING_FUNC, 0); | |
993 | DEFINE_FIELD(unsigned long, vaddr[1], FIELD_STRING_RETIP, 0); | |
994 | size = SIZEOF_TRACE_ENTRY(true); | |
995 | } else { | |
996 | DEFINE_FIELD(unsigned long, vaddr[0], FIELD_STRING_IP, 0); | |
997 | size = SIZEOF_TRACE_ENTRY(false); | |
998 | } | |
f3f096cf | 999 | /* Set argument names as fields */ |
14577c39 NK |
1000 | for (i = 0; i < tu->tp.nr_args; i++) { |
1001 | struct probe_arg *parg = &tu->tp.args[i]; | |
1002 | ||
1003 | ret = trace_define_field(event_call, parg->type->fmttype, | |
1004 | parg->name, size + parg->offset, | |
1005 | parg->type->size, parg->type->is_signed, | |
f3f096cf SD |
1006 | FILTER_OTHER); |
1007 | ||
1008 | if (ret) | |
1009 | return ret; | |
1010 | } | |
1011 | return 0; | |
1012 | } | |
1013 | ||
f3f096cf | 1014 | #ifdef CONFIG_PERF_EVENTS |
31ba3348 ON |
1015 | static bool |
1016 | __uprobe_perf_filter(struct trace_uprobe_filter *filter, struct mm_struct *mm) | |
1017 | { | |
1018 | struct perf_event *event; | |
1019 | ||
1020 | if (filter->nr_systemwide) | |
1021 | return true; | |
1022 | ||
1023 | list_for_each_entry(event, &filter->perf_events, hw.tp_list) { | |
50f16a8b | 1024 | if (event->hw.target->mm == mm) |
31ba3348 ON |
1025 | return true; |
1026 | } | |
1027 | ||
1028 | return false; | |
1029 | } | |
1030 | ||
b2fe8ba6 ON |
1031 | static inline bool |
1032 | uprobe_filter_event(struct trace_uprobe *tu, struct perf_event *event) | |
1033 | { | |
50f16a8b | 1034 | return __uprobe_perf_filter(&tu->filter, event->hw.target->mm); |
b2fe8ba6 ON |
1035 | } |
1036 | ||
ce5f36a5 | 1037 | static int uprobe_perf_close(struct trace_uprobe *tu, struct perf_event *event) |
736288ba | 1038 | { |
b2fe8ba6 ON |
1039 | bool done; |
1040 | ||
736288ba | 1041 | write_lock(&tu->filter.rwlock); |
50f16a8b | 1042 | if (event->hw.target) { |
ce5f36a5 | 1043 | list_del(&event->hw.tp_list); |
b2fe8ba6 | 1044 | done = tu->filter.nr_systemwide || |
50f16a8b | 1045 | (event->hw.target->flags & PF_EXITING) || |
b2fe8ba6 | 1046 | uprobe_filter_event(tu, event); |
b2fe8ba6 | 1047 | } else { |
ce5f36a5 | 1048 | tu->filter.nr_systemwide--; |
b2fe8ba6 | 1049 | done = tu->filter.nr_systemwide; |
b2fe8ba6 | 1050 | } |
736288ba ON |
1051 | write_unlock(&tu->filter.rwlock); |
1052 | ||
b2fe8ba6 | 1053 | if (!done) |
927d6874 | 1054 | return uprobe_apply(tu->inode, tu->offset, &tu->consumer, false); |
31ba3348 | 1055 | |
736288ba ON |
1056 | return 0; |
1057 | } | |
1058 | ||
ce5f36a5 | 1059 | static int uprobe_perf_open(struct trace_uprobe *tu, struct perf_event *event) |
736288ba | 1060 | { |
b2fe8ba6 | 1061 | bool done; |
927d6874 | 1062 | int err; |
b2fe8ba6 | 1063 | |
736288ba | 1064 | write_lock(&tu->filter.rwlock); |
50f16a8b | 1065 | if (event->hw.target) { |
ce5f36a5 ON |
1066 | /* |
1067 | * event->parent != NULL means copy_process(), we can avoid | |
1068 | * uprobe_apply(). current->mm must be probed and we can rely | |
1069 | * on dup_mmap() which preserves the already installed bp's. | |
1070 | * | |
1071 | * attr.enable_on_exec means that exec/mmap will install the | |
1072 | * breakpoints we need. | |
1073 | */ | |
b2fe8ba6 | 1074 | done = tu->filter.nr_systemwide || |
ce5f36a5 | 1075 | event->parent || event->attr.enable_on_exec || |
b2fe8ba6 | 1076 | uprobe_filter_event(tu, event); |
ce5f36a5 | 1077 | list_add(&event->hw.tp_list, &tu->filter.perf_events); |
b2fe8ba6 | 1078 | } else { |
b2fe8ba6 | 1079 | done = tu->filter.nr_systemwide; |
ce5f36a5 | 1080 | tu->filter.nr_systemwide++; |
b2fe8ba6 | 1081 | } |
736288ba ON |
1082 | write_unlock(&tu->filter.rwlock); |
1083 | ||
927d6874 ON |
1084 | err = 0; |
1085 | if (!done) { | |
1086 | err = uprobe_apply(tu->inode, tu->offset, &tu->consumer, true); | |
1087 | if (err) | |
1088 | uprobe_perf_close(tu, event); | |
1089 | } | |
1090 | return err; | |
736288ba ON |
1091 | } |
1092 | ||
31ba3348 ON |
1093 | static bool uprobe_perf_filter(struct uprobe_consumer *uc, |
1094 | enum uprobe_filter_ctx ctx, struct mm_struct *mm) | |
1095 | { | |
1096 | struct trace_uprobe *tu; | |
1097 | int ret; | |
1098 | ||
1099 | tu = container_of(uc, struct trace_uprobe, consumer); | |
1100 | read_lock(&tu->filter.rwlock); | |
1101 | ret = __uprobe_perf_filter(&tu->filter, mm); | |
1102 | read_unlock(&tu->filter.rwlock); | |
1103 | ||
1104 | return ret; | |
1105 | } | |
1106 | ||
a43b9704 | 1107 | static void __uprobe_perf_func(struct trace_uprobe *tu, |
dd9fa555 NK |
1108 | unsigned long func, struct pt_regs *regs, |
1109 | struct uprobe_cpu_buffer *ucb, int dsize) | |
f3f096cf | 1110 | { |
2425bcb9 | 1111 | struct trace_event_call *call = &tu->tp.call; |
f3f096cf | 1112 | struct uprobe_trace_entry_head *entry; |
04a22fae | 1113 | struct bpf_prog *prog = call->prog; |
f3f096cf | 1114 | struct hlist_head *head; |
457d1772 | 1115 | void *data; |
dd9fa555 | 1116 | int size, esize; |
dcad1a20 NK |
1117 | int rctx; |
1118 | ||
04a22fae WN |
1119 | if (prog && !trace_call_bpf(prog, regs)) |
1120 | return; | |
1121 | ||
dcad1a20 | 1122 | esize = SIZEOF_TRACE_ENTRY(is_ret_probe(tu)); |
f3f096cf | 1123 | |
dcad1a20 NK |
1124 | size = esize + tu->tp.size + dsize; |
1125 | size = ALIGN(size + sizeof(u32), sizeof(u64)) - sizeof(u32); | |
1126 | if (WARN_ONCE(size > PERF_MAX_TRACE_SIZE, "profile buffer not large enough")) | |
1127 | return; | |
1128 | ||
f3f096cf | 1129 | preempt_disable(); |
515619f2 ON |
1130 | head = this_cpu_ptr(call->perf_events); |
1131 | if (hlist_empty(head)) | |
1132 | goto out; | |
1133 | ||
86038c5e | 1134 | entry = perf_trace_buf_prepare(size, call->event.type, NULL, &rctx); |
f3f096cf SD |
1135 | if (!entry) |
1136 | goto out; | |
1137 | ||
393a736c ON |
1138 | if (is_ret_probe(tu)) { |
1139 | entry->vaddr[0] = func; | |
32520b2c | 1140 | entry->vaddr[1] = instruction_pointer(regs); |
393a736c ON |
1141 | data = DATAOF_TRACE_ENTRY(entry, true); |
1142 | } else { | |
32520b2c | 1143 | entry->vaddr[0] = instruction_pointer(regs); |
393a736c ON |
1144 | data = DATAOF_TRACE_ENTRY(entry, false); |
1145 | } | |
1146 | ||
dcad1a20 NK |
1147 | memcpy(data, ucb->buf, tu->tp.size + dsize); |
1148 | ||
1149 | if (size - esize > tu->tp.size + dsize) { | |
1150 | int len = tu->tp.size + dsize; | |
14577c39 | 1151 | |
dcad1a20 | 1152 | memset(data + len, 0, size - esize - len); |
14577c39 | 1153 | } |
f3f096cf | 1154 | |
32520b2c | 1155 | perf_trace_buf_submit(entry, size, rctx, 0, 1, regs, head, NULL); |
f3f096cf SD |
1156 | out: |
1157 | preempt_enable(); | |
a51cc604 ON |
1158 | } |
1159 | ||
1160 | /* uprobe profile handler */ | |
dd9fa555 NK |
1161 | static int uprobe_perf_func(struct trace_uprobe *tu, struct pt_regs *regs, |
1162 | struct uprobe_cpu_buffer *ucb, int dsize) | |
a51cc604 ON |
1163 | { |
1164 | if (!uprobe_perf_filter(&tu->consumer, 0, current->mm)) | |
1165 | return UPROBE_HANDLER_REMOVE; | |
1166 | ||
393a736c | 1167 | if (!is_ret_probe(tu)) |
dd9fa555 | 1168 | __uprobe_perf_func(tu, 0, regs, ucb, dsize); |
f42d24a1 | 1169 | return 0; |
f3f096cf | 1170 | } |
c1ae5c75 ON |
1171 | |
/*
 * uretprobe profile handler: forwards to __uprobe_perf_func() with @func
 * passed through.  No filter check is performed here.
 */
static void uretprobe_perf_func(struct trace_uprobe *tu, unsigned long func,
				struct pt_regs *regs,
				struct uprobe_cpu_buffer *ucb, int dsize)
{
	__uprobe_perf_func(tu, func, regs, ucb, dsize);
}
f3f096cf SD |
1178 | #endif /* CONFIG_PERF_EVENTS */ |
1179 | ||
70ed91c6 | 1180 | static int |
2425bcb9 | 1181 | trace_uprobe_register(struct trace_event_call *event, enum trace_reg type, |
70ed91c6 | 1182 | void *data) |
f3f096cf | 1183 | { |
457d1772 | 1184 | struct trace_uprobe *tu = event->data; |
7f1d2f82 | 1185 | struct trace_event_file *file = data; |
f3f096cf SD |
1186 | |
1187 | switch (type) { | |
1188 | case TRACE_REG_REGISTER: | |
70ed91c6 | 1189 | return probe_event_enable(tu, file, NULL); |
f3f096cf SD |
1190 | |
1191 | case TRACE_REG_UNREGISTER: | |
70ed91c6 | 1192 | probe_event_disable(tu, file); |
f3f096cf SD |
1193 | return 0; |
1194 | ||
1195 | #ifdef CONFIG_PERF_EVENTS | |
1196 | case TRACE_REG_PERF_REGISTER: | |
70ed91c6 | 1197 | return probe_event_enable(tu, NULL, uprobe_perf_filter); |
f3f096cf SD |
1198 | |
1199 | case TRACE_REG_PERF_UNREGISTER: | |
70ed91c6 | 1200 | probe_event_disable(tu, NULL); |
f3f096cf | 1201 | return 0; |
736288ba ON |
1202 | |
1203 | case TRACE_REG_PERF_OPEN: | |
1204 | return uprobe_perf_open(tu, data); | |
1205 | ||
1206 | case TRACE_REG_PERF_CLOSE: | |
1207 | return uprobe_perf_close(tu, data); | |
1208 | ||
f3f096cf SD |
1209 | #endif |
1210 | default: | |
1211 | return 0; | |
1212 | } | |
1213 | return 0; | |
1214 | } | |
1215 | ||
1216 | static int uprobe_dispatcher(struct uprobe_consumer *con, struct pt_regs *regs) | |
1217 | { | |
f3f096cf | 1218 | struct trace_uprobe *tu; |
b7e0bf34 | 1219 | struct uprobe_dispatch_data udd; |
dd9fa555 NK |
1220 | struct uprobe_cpu_buffer *ucb; |
1221 | int dsize, esize; | |
f42d24a1 | 1222 | int ret = 0; |
f3f096cf | 1223 | |
dd9fa555 | 1224 | |
a932b738 | 1225 | tu = container_of(con, struct trace_uprobe, consumer); |
1b47aefd | 1226 | tu->nhit++; |
f3f096cf | 1227 | |
b7e0bf34 NK |
1228 | udd.tu = tu; |
1229 | udd.bp_addr = instruction_pointer(regs); | |
1230 | ||
1231 | current->utask->vaddr = (unsigned long) &udd; | |
1232 | ||
dd9fa555 NK |
1233 | if (WARN_ON_ONCE(!uprobe_cpu_buffer)) |
1234 | return 0; | |
1235 | ||
1236 | dsize = __get_data_size(&tu->tp, regs); | |
1237 | esize = SIZEOF_TRACE_ENTRY(is_ret_probe(tu)); | |
1238 | ||
1239 | ucb = uprobe_buffer_get(); | |
1240 | store_trace_args(esize, &tu->tp, regs, ucb->buf, dsize); | |
1241 | ||
14577c39 | 1242 | if (tu->tp.flags & TP_FLAG_TRACE) |
dd9fa555 | 1243 | ret |= uprobe_trace_func(tu, regs, ucb, dsize); |
f3f096cf SD |
1244 | |
1245 | #ifdef CONFIG_PERF_EVENTS | |
14577c39 | 1246 | if (tu->tp.flags & TP_FLAG_PROFILE) |
dd9fa555 | 1247 | ret |= uprobe_perf_func(tu, regs, ucb, dsize); |
f3f096cf | 1248 | #endif |
dd9fa555 | 1249 | uprobe_buffer_put(ucb); |
f42d24a1 | 1250 | return ret; |
f3f096cf SD |
1251 | } |
1252 | ||
c1ae5c75 ON |
1253 | static int uretprobe_dispatcher(struct uprobe_consumer *con, |
1254 | unsigned long func, struct pt_regs *regs) | |
1255 | { | |
1256 | struct trace_uprobe *tu; | |
b7e0bf34 | 1257 | struct uprobe_dispatch_data udd; |
dd9fa555 NK |
1258 | struct uprobe_cpu_buffer *ucb; |
1259 | int dsize, esize; | |
c1ae5c75 ON |
1260 | |
1261 | tu = container_of(con, struct trace_uprobe, consumer); | |
1262 | ||
b7e0bf34 NK |
1263 | udd.tu = tu; |
1264 | udd.bp_addr = func; | |
1265 | ||
1266 | current->utask->vaddr = (unsigned long) &udd; | |
1267 | ||
dd9fa555 NK |
1268 | if (WARN_ON_ONCE(!uprobe_cpu_buffer)) |
1269 | return 0; | |
1270 | ||
1271 | dsize = __get_data_size(&tu->tp, regs); | |
1272 | esize = SIZEOF_TRACE_ENTRY(is_ret_probe(tu)); | |
1273 | ||
1274 | ucb = uprobe_buffer_get(); | |
1275 | store_trace_args(esize, &tu->tp, regs, ucb->buf, dsize); | |
1276 | ||
14577c39 | 1277 | if (tu->tp.flags & TP_FLAG_TRACE) |
dd9fa555 | 1278 | uretprobe_trace_func(tu, func, regs, ucb, dsize); |
c1ae5c75 ON |
1279 | |
1280 | #ifdef CONFIG_PERF_EVENTS | |
14577c39 | 1281 | if (tu->tp.flags & TP_FLAG_PROFILE) |
dd9fa555 | 1282 | uretprobe_perf_func(tu, func, regs, ucb, dsize); |
c1ae5c75 | 1283 | #endif |
dd9fa555 | 1284 | uprobe_buffer_put(ucb); |
c1ae5c75 ON |
1285 | return 0; |
1286 | } | |
1287 | ||
f3f096cf SD |
1288 | static struct trace_event_functions uprobe_funcs = { |
1289 | .trace = print_uprobe_event | |
1290 | }; | |
1291 | ||
1292 | static int register_uprobe_event(struct trace_uprobe *tu) | |
1293 | { | |
2425bcb9 | 1294 | struct trace_event_call *call = &tu->tp.call; |
f3f096cf SD |
1295 | int ret; |
1296 | ||
2425bcb9 | 1297 | /* Initialize trace_event_call */ |
f3f096cf SD |
1298 | INIT_LIST_HEAD(&call->class->fields); |
1299 | call->event.funcs = &uprobe_funcs; | |
1300 | call->class->define_fields = uprobe_event_define_fields; | |
1301 | ||
5bf652aa | 1302 | if (set_print_fmt(&tu->tp, is_ret_probe(tu)) < 0) |
f3f096cf SD |
1303 | return -ENOMEM; |
1304 | ||
9023c930 | 1305 | ret = register_trace_event(&call->event); |
f3f096cf SD |
1306 | if (!ret) { |
1307 | kfree(call->print_fmt); | |
1308 | return -ENODEV; | |
1309 | } | |
ede392a7 | 1310 | |
04a22fae | 1311 | call->flags = TRACE_EVENT_FL_UPROBE; |
f3f096cf SD |
1312 | call->class->reg = trace_uprobe_register; |
1313 | call->data = tu; | |
1314 | ret = trace_add_event_call(call); | |
1315 | ||
1316 | if (ret) { | |
de7b2973 | 1317 | pr_info("Failed to register uprobe event: %s\n", |
687fcc4a | 1318 | trace_event_name(call)); |
f3f096cf | 1319 | kfree(call->print_fmt); |
9023c930 | 1320 | unregister_trace_event(&call->event); |
f3f096cf SD |
1321 | } |
1322 | ||
1323 | return ret; | |
1324 | } | |
1325 | ||
c6c2401d | 1326 | static int unregister_uprobe_event(struct trace_uprobe *tu) |
f3f096cf | 1327 | { |
c6c2401d SRRH |
1328 | int ret; |
1329 | ||
f3f096cf | 1330 | /* tu->event is unregistered in trace_remove_event_call() */ |
14577c39 | 1331 | ret = trace_remove_event_call(&tu->tp.call); |
c6c2401d SRRH |
1332 | if (ret) |
1333 | return ret; | |
14577c39 NK |
1334 | kfree(tu->tp.call.print_fmt); |
1335 | tu->tp.call.print_fmt = NULL; | |
c6c2401d | 1336 | return 0; |
f3f096cf SD |
1337 | } |
1338 | ||
1339 | /* Make a trace interface for controlling probe points */ |
1340 | static __init int init_uprobe_trace(void) | |
1341 | { | |
1342 | struct dentry *d_tracer; | |
1343 | ||
1344 | d_tracer = tracing_init_dentry(); | |
14a5ae40 | 1345 | if (IS_ERR(d_tracer)) |
f3f096cf SD |
1346 | return 0; |
1347 | ||
1348 | trace_create_file("uprobe_events", 0644, d_tracer, | |
1349 | NULL, &uprobe_events_ops); | |
1350 | /* Profile interface */ | |
1351 | trace_create_file("uprobe_profile", 0444, d_tracer, | |
1352 | NULL, &uprobe_profile_ops); | |
1353 | return 0; | |
1354 | } | |
1355 | ||
1356 | fs_initcall(init_uprobe_trace); |