uprobes: Fix return value in error handling path
[linux-2.6-block.git] / kernel / trace / trace_syscalls.c
CommitLineData
47788c58 1#include <trace/syscall.h>
1c569f02 2#include <trace/events/syscalls.h>
f431b634 3#include <linux/syscalls.h>
5a0e3ad6 4#include <linux/slab.h>
ee08c6ec 5#include <linux/kernel.h>
56d82e00 6#include <linux/module.h> /* for MODULE_NAME_LEN via KSYM_SYMBOL_LEN */
fb34a08c 7#include <linux/ftrace.h>
cdd6c482 8#include <linux/perf_event.h>
ee08c6ec
FW
9#include <asm/syscall.h>
10
11#include "trace_output.h"
12#include "trace.h"
13
5be71b61 14static DEFINE_MUTEX(syscall_trace_lock);
ee08c6ec 15
2239291a 16static int syscall_enter_register(struct ftrace_event_call *event,
ceec0b6f 17 enum trace_reg type, void *data);
2239291a 18static int syscall_exit_register(struct ftrace_event_call *event,
ceec0b6f 19 enum trace_reg type, void *data);
2239291a 20
2e33af02
SR
21static struct list_head *
22syscall_get_enter_fields(struct ftrace_event_call *call)
23{
24 struct syscall_metadata *entry = call->data;
25
26 return &entry->enter_fields;
27}
28
3d56e331
SR
29extern struct syscall_metadata *__start_syscalls_metadata[];
30extern struct syscall_metadata *__stop_syscalls_metadata[];
c44fc770
FW
31
32static struct syscall_metadata **syscalls_metadata;
33
b2d55496
IM
#ifndef ARCH_HAS_SYSCALL_MATCH_SYM_NAME
/*
 * Compare a symbol name with a syscall metadata name, ignoring the first
 * three characters of each.
 *
 * Only compare after the "sys" prefix. Archs that use syscall wrappers
 * may have syscalls symbols aliases prefixed with ".SyS" or ".sys"
 * instead of "sys", leading to an unwanted mismatch.
 *
 * Returns true when both names are identical past the prefix. A name
 * shorter than the prefix can never match; rejecting it up front keeps
 * the comparison from starting beyond the string's terminator.
 */
static inline bool arch_syscall_match_sym_name(const char *sym, const char *name)
{
	const size_t prefix_len = sizeof("sys") - 1;

	if (strlen(sym) < prefix_len || strlen(name) < prefix_len)
		return false;

	return !strcmp(sym + prefix_len, name + prefix_len);
}
#endif
46
f431b634
SR
#ifdef ARCH_TRACE_IGNORE_COMPAT_SYSCALLS
/*
 * On some architectures a 64bit kernel can run 32bit applications
 * whose syscalls are not mapped the same way as those of 64bit tasks
 * (x86 being the notable example).
 *
 * Rather than report the wrong syscall for such tasks, they are
 * ignored: -1 is returned in place of a syscall number.
 *
 * An arch opts in by defining ARCH_TRACE_IGNORE_COMPAT_SYSCALLS and by
 * providing arch_trace_is_compat_syscall(), which tells the tracing
 * system which syscalls to ignore.
 */
static int
trace_get_syscall_nr(struct task_struct *task, struct pt_regs *regs)
{
	return unlikely(arch_trace_is_compat_syscall(regs)) ?
		-1 : syscall_get_nr(task, regs);
}
#else
/* No compat filtering: hand back whatever syscall_get_nr() reports. */
static inline int
trace_get_syscall_nr(struct task_struct *task, struct pt_regs *regs)
{
	return syscall_get_nr(task, regs);
}
#endif /* ARCH_TRACE_IGNORE_COMPAT_SYSCALLS */
78
3d56e331
SR
79static __init struct syscall_metadata *
80find_syscall_meta(unsigned long syscall)
c44fc770 81{
3d56e331
SR
82 struct syscall_metadata **start;
83 struct syscall_metadata **stop;
c44fc770
FW
84 char str[KSYM_SYMBOL_LEN];
85
86
3d56e331
SR
87 start = __start_syscalls_metadata;
88 stop = __stop_syscalls_metadata;
c44fc770
FW
89 kallsyms_lookup(syscall, NULL, NULL, NULL, str);
90
ae07f551
IM
91 if (arch_syscall_match_sym_name(str, "sys_ni_syscall"))
92 return NULL;
93
c44fc770 94 for ( ; start < stop; start++) {
b2d55496 95 if ((*start)->name && arch_syscall_match_sym_name(str, (*start)->name))
3d56e331 96 return *start;
c44fc770
FW
97 }
98 return NULL;
99}
100
101static struct syscall_metadata *syscall_nr_to_meta(int nr)
102{
103 if (!syscalls_metadata || nr >= NR_syscalls || nr < 0)
104 return NULL;
105
106 return syscalls_metadata[nr];
107}
108
6aea49cb 109static enum print_line_t
a9a57763
SR
110print_syscall_enter(struct trace_iterator *iter, int flags,
111 struct trace_event *event)
bed1ffca
FW
112{
113 struct trace_seq *s = &iter->seq;
114 struct trace_entry *ent = iter->ent;
115 struct syscall_trace_enter *trace;
116 struct syscall_metadata *entry;
117 int i, ret, syscall;
118
64c12e04 119 trace = (typeof(trace))ent;
bed1ffca 120 syscall = trace->nr;
bed1ffca 121 entry = syscall_nr_to_meta(syscall);
64c12e04 122
bed1ffca
FW
123 if (!entry)
124 goto end;
125
32c0edae 126 if (entry->enter_event->event.type != ent->type) {
64c12e04
JB
127 WARN_ON_ONCE(1);
128 goto end;
129 }
130
bed1ffca
FW
131 ret = trace_seq_printf(s, "%s(", entry->name);
132 if (!ret)
133 return TRACE_TYPE_PARTIAL_LINE;
134
135 for (i = 0; i < entry->nb_args; i++) {
136 /* parameter types */
ba8b3a40 137 if (trace_flags & TRACE_ITER_VERBOSE) {
bed1ffca
FW
138 ret = trace_seq_printf(s, "%s ", entry->types[i]);
139 if (!ret)
140 return TRACE_TYPE_PARTIAL_LINE;
141 }
142 /* parameter values */
4539f077 143 ret = trace_seq_printf(s, "%s: %lx%s", entry->args[i],
bed1ffca 144 trace->args[i],
4539f077 145 i == entry->nb_args - 1 ? "" : ", ");
bed1ffca
FW
146 if (!ret)
147 return TRACE_TYPE_PARTIAL_LINE;
148 }
149
4539f077
LZ
150 ret = trace_seq_putc(s, ')');
151 if (!ret)
152 return TRACE_TYPE_PARTIAL_LINE;
153
bed1ffca 154end:
4539f077
LZ
155 ret = trace_seq_putc(s, '\n');
156 if (!ret)
157 return TRACE_TYPE_PARTIAL_LINE;
158
bed1ffca
FW
159 return TRACE_TYPE_HANDLED;
160}
161
6aea49cb 162static enum print_line_t
a9a57763
SR
163print_syscall_exit(struct trace_iterator *iter, int flags,
164 struct trace_event *event)
bed1ffca
FW
165{
166 struct trace_seq *s = &iter->seq;
167 struct trace_entry *ent = iter->ent;
168 struct syscall_trace_exit *trace;
169 int syscall;
170 struct syscall_metadata *entry;
171 int ret;
172
64c12e04 173 trace = (typeof(trace))ent;
bed1ffca 174 syscall = trace->nr;
bed1ffca 175 entry = syscall_nr_to_meta(syscall);
64c12e04 176
bed1ffca
FW
177 if (!entry) {
178 trace_seq_printf(s, "\n");
179 return TRACE_TYPE_HANDLED;
180 }
181
32c0edae 182 if (entry->exit_event->event.type != ent->type) {
64c12e04
JB
183 WARN_ON_ONCE(1);
184 return TRACE_TYPE_UNHANDLED;
185 }
186
bed1ffca
FW
187 ret = trace_seq_printf(s, "%s -> 0x%lx\n", entry->name,
188 trace->ret);
189 if (!ret)
190 return TRACE_TYPE_PARTIAL_LINE;
191
192 return TRACE_TYPE_HANDLED;
193}
194
e6971969
LZ
/* Declared only; no definition is visible in this file. */
extern char *__bad_type_size(void);

/*
 * Expand to the type-string, name-string, offset, size and signedness
 * arguments of trace_define_field() for member @name of a local
 * variable that must be called "trace" at the expansion site.
 *
 * If sizeof(@type) differs from the size of the member, the first
 * argument becomes a call to __bad_type_size() instead of the type
 * string (presumably to make a mismatch fail at link time -- confirm).
 */
#define SYSCALL_FIELD(type, name)					\
	sizeof(type) != sizeof(trace.name) ?				\
		__bad_type_size() :					\
		#type, #name, offsetof(typeof(trace), name),		\
		sizeof(trace.name), is_signed_type(type)
e6971969 202
50307a45
LJ
203static
204int __set_enter_print_fmt(struct syscall_metadata *entry, char *buf, int len)
205{
206 int i;
207 int pos = 0;
208
209 /* When len=0, we just calculate the needed length */
210#define LEN_OR_ZERO (len ? len - pos : 0)
211
212 pos += snprintf(buf + pos, LEN_OR_ZERO, "\"");
213 for (i = 0; i < entry->nb_args; i++) {
214 pos += snprintf(buf + pos, LEN_OR_ZERO, "%s: 0x%%0%zulx%s",
215 entry->args[i], sizeof(unsigned long),
216 i == entry->nb_args - 1 ? "" : ", ");
217 }
218 pos += snprintf(buf + pos, LEN_OR_ZERO, "\"");
219
220 for (i = 0; i < entry->nb_args; i++) {
221 pos += snprintf(buf + pos, LEN_OR_ZERO,
222 ", ((unsigned long)(REC->%s))", entry->args[i]);
223 }
224
225#undef LEN_OR_ZERO
226
227 /* return the length of print_fmt */
228 return pos;
229}
230
231static int set_syscall_print_fmt(struct ftrace_event_call *call)
232{
233 char *print_fmt;
234 int len;
235 struct syscall_metadata *entry = call->data;
236
237 if (entry->enter_event != call) {
238 call->print_fmt = "\"0x%lx\", REC->ret";
239 return 0;
240 }
241
242 /* First: called with 0 length to calculate the needed length */
243 len = __set_enter_print_fmt(entry, NULL, 0);
244
245 print_fmt = kmalloc(len + 1, GFP_KERNEL);
246 if (!print_fmt)
247 return -ENOMEM;
248
249 /* Second: actually write the @print_fmt */
250 __set_enter_print_fmt(entry, print_fmt, len + 1);
251 call->print_fmt = print_fmt;
252
253 return 0;
254}
255
256static void free_syscall_print_fmt(struct ftrace_event_call *call)
257{
258 struct syscall_metadata *entry = call->data;
259
260 if (entry->enter_event == call)
261 kfree(call->print_fmt);
262}
263
b8aae39f 264static int __init syscall_enter_define_fields(struct ftrace_event_call *call)
540b7b8d
LZ
265{
266 struct syscall_trace_enter trace;
31c16b13 267 struct syscall_metadata *meta = call->data;
540b7b8d 268 int ret;
540b7b8d
LZ
269 int i;
270 int offset = offsetof(typeof(trace), args);
271
0f1ef51d
LJ
272 ret = trace_define_field(call, SYSCALL_FIELD(int, nr), FILTER_OTHER);
273 if (ret)
274 return ret;
275
540b7b8d 276 for (i = 0; i < meta->nb_args; i++) {
aeaeae11
FW
277 ret = trace_define_field(call, meta->types[i],
278 meta->args[i], offset,
43b51ead
LZ
279 sizeof(unsigned long), 0,
280 FILTER_OTHER);
540b7b8d
LZ
281 offset += sizeof(unsigned long);
282 }
283
284 return ret;
285}
286
b8aae39f 287static int __init syscall_exit_define_fields(struct ftrace_event_call *call)
540b7b8d
LZ
288{
289 struct syscall_trace_exit trace;
290 int ret;
291
0f1ef51d
LJ
292 ret = trace_define_field(call, SYSCALL_FIELD(int, nr), FILTER_OTHER);
293 if (ret)
294 return ret;
295
26a50744 296 ret = trace_define_field(call, SYSCALL_FIELD(long, ret),
43b51ead 297 FILTER_OTHER);
540b7b8d
LZ
298
299 return ret;
300}
301
12ab74ee 302static void ftrace_syscall_enter(void *data, struct pt_regs *regs, long id)
ee08c6ec 303{
12ab74ee 304 struct trace_array *tr = data;
bed1ffca
FW
305 struct syscall_trace_enter *entry;
306 struct syscall_metadata *sys_data;
307 struct ring_buffer_event *event;
e77405ad 308 struct ring_buffer *buffer;
ee08c6ec 309 int syscall_nr;
f431b634 310 int size;
ee08c6ec 311
f431b634 312 syscall_nr = trace_get_syscall_nr(current, regs);
cd0980fc
HB
313 if (syscall_nr < 0)
314 return;
12ab74ee 315 if (!test_bit(syscall_nr, tr->enabled_enter_syscalls))
fb34a08c 316 return;
ee08c6ec 317
bed1ffca
FW
318 sys_data = syscall_nr_to_meta(syscall_nr);
319 if (!sys_data)
320 return;
321
322 size = sizeof(*entry) + sizeof(unsigned long) * sys_data->nb_args;
323
12883efb 324 buffer = tr->trace_buffer.buffer;
12ab74ee 325 event = trace_buffer_lock_reserve(buffer,
32c0edae 326 sys_data->enter_event->event.type, size, 0, 0);
bed1ffca
FW
327 if (!event)
328 return;
329
330 entry = ring_buffer_event_data(event);
331 entry->nr = syscall_nr;
332 syscall_get_arguments(current, regs, 0, sys_data->nb_args, entry->args);
333
e77405ad
SR
334 if (!filter_current_check_discard(buffer, sys_data->enter_event,
335 entry, event))
336 trace_current_buffer_unlock_commit(buffer, event, 0, 0);
ee08c6ec
FW
337}
338
12ab74ee 339static void ftrace_syscall_exit(void *data, struct pt_regs *regs, long ret)
ee08c6ec 340{
12ab74ee 341 struct trace_array *tr = data;
bed1ffca
FW
342 struct syscall_trace_exit *entry;
343 struct syscall_metadata *sys_data;
344 struct ring_buffer_event *event;
e77405ad 345 struct ring_buffer *buffer;
ee08c6ec
FW
346 int syscall_nr;
347
f431b634 348 syscall_nr = trace_get_syscall_nr(current, regs);
cd0980fc
HB
349 if (syscall_nr < 0)
350 return;
12ab74ee 351 if (!test_bit(syscall_nr, tr->enabled_exit_syscalls))
fb34a08c 352 return;
ee08c6ec 353
bed1ffca
FW
354 sys_data = syscall_nr_to_meta(syscall_nr);
355 if (!sys_data)
356 return;
357
12883efb 358 buffer = tr->trace_buffer.buffer;
12ab74ee 359 event = trace_buffer_lock_reserve(buffer,
32c0edae 360 sys_data->exit_event->event.type, sizeof(*entry), 0, 0);
bed1ffca
FW
361 if (!event)
362 return;
363
364 entry = ring_buffer_event_data(event);
365 entry->nr = syscall_nr;
366 entry->ret = syscall_get_return_value(current, regs);
367
e77405ad
SR
368 if (!filter_current_check_discard(buffer, sys_data->exit_event,
369 entry, event))
370 trace_current_buffer_unlock_commit(buffer, event, 0, 0);
ee08c6ec
FW
371}
372
12ab74ee
SR
373static int reg_event_syscall_enter(struct ftrace_event_file *file,
374 struct ftrace_event_call *call)
ee08c6ec 375{
12ab74ee 376 struct trace_array *tr = file->tr;
fb34a08c
JB
377 int ret = 0;
378 int num;
fb34a08c 379
c252f657 380 num = ((struct syscall_metadata *)call->data)->syscall_nr;
3773b389 381 if (WARN_ON_ONCE(num < 0 || num >= NR_syscalls))
fb34a08c
JB
382 return -ENOSYS;
383 mutex_lock(&syscall_trace_lock);
12ab74ee
SR
384 if (!tr->sys_refcount_enter)
385 ret = register_trace_sys_enter(ftrace_syscall_enter, tr);
3b8e4273 386 if (!ret) {
12ab74ee
SR
387 set_bit(num, tr->enabled_enter_syscalls);
388 tr->sys_refcount_enter++;
fb34a08c
JB
389 }
390 mutex_unlock(&syscall_trace_lock);
391 return ret;
ee08c6ec
FW
392}
393
12ab74ee
SR
394static void unreg_event_syscall_enter(struct ftrace_event_file *file,
395 struct ftrace_event_call *call)
ee08c6ec 396{
12ab74ee 397 struct trace_array *tr = file->tr;
fb34a08c 398 int num;
ee08c6ec 399
c252f657 400 num = ((struct syscall_metadata *)call->data)->syscall_nr;
3773b389 401 if (WARN_ON_ONCE(num < 0 || num >= NR_syscalls))
fb34a08c
JB
402 return;
403 mutex_lock(&syscall_trace_lock);
12ab74ee
SR
404 tr->sys_refcount_enter--;
405 clear_bit(num, tr->enabled_enter_syscalls);
406 if (!tr->sys_refcount_enter)
407 unregister_trace_sys_enter(ftrace_syscall_enter, tr);
fb34a08c
JB
408 mutex_unlock(&syscall_trace_lock);
409}
ee08c6ec 410
12ab74ee
SR
411static int reg_event_syscall_exit(struct ftrace_event_file *file,
412 struct ftrace_event_call *call)
ee08c6ec 413{
12ab74ee 414 struct trace_array *tr = file->tr;
fb34a08c
JB
415 int ret = 0;
416 int num;
fb34a08c 417
c252f657 418 num = ((struct syscall_metadata *)call->data)->syscall_nr;
3773b389 419 if (WARN_ON_ONCE(num < 0 || num >= NR_syscalls))
fb34a08c
JB
420 return -ENOSYS;
421 mutex_lock(&syscall_trace_lock);
12ab74ee
SR
422 if (!tr->sys_refcount_exit)
423 ret = register_trace_sys_exit(ftrace_syscall_exit, tr);
3b8e4273 424 if (!ret) {
12ab74ee
SR
425 set_bit(num, tr->enabled_exit_syscalls);
426 tr->sys_refcount_exit++;
ee08c6ec 427 }
fb34a08c
JB
428 mutex_unlock(&syscall_trace_lock);
429 return ret;
430}
ee08c6ec 431
12ab74ee
SR
432static void unreg_event_syscall_exit(struct ftrace_event_file *file,
433 struct ftrace_event_call *call)
fb34a08c 434{
12ab74ee 435 struct trace_array *tr = file->tr;
fb34a08c 436 int num;
ee08c6ec 437
c252f657 438 num = ((struct syscall_metadata *)call->data)->syscall_nr;
3773b389 439 if (WARN_ON_ONCE(num < 0 || num >= NR_syscalls))
fb34a08c
JB
440 return;
441 mutex_lock(&syscall_trace_lock);
12ab74ee
SR
442 tr->sys_refcount_exit--;
443 clear_bit(num, tr->enabled_exit_syscalls);
444 if (!tr->sys_refcount_exit)
445 unregister_trace_sys_exit(ftrace_syscall_exit, tr);
fb34a08c 446 mutex_unlock(&syscall_trace_lock);
ee08c6ec 447}
fb34a08c 448
6f86ab9f 449static int init_syscall_trace(struct ftrace_event_call *call)
a1301da0
LJ
450{
451 int id;
ba976970
IM
452 int num;
453
454 num = ((struct syscall_metadata *)call->data)->syscall_nr;
455 if (num < 0 || num >= NR_syscalls) {
456 pr_debug("syscall %s metadata not mapped, disabling ftrace event\n",
457 ((struct syscall_metadata *)call->data)->name);
458 return -ENOSYS;
459 }
a1301da0 460
50307a45
LJ
461 if (set_syscall_print_fmt(call) < 0)
462 return -ENOMEM;
463
c7ef3a90
SR
464 id = trace_event_raw_init(call);
465
466 if (id < 0) {
50307a45 467 free_syscall_print_fmt(call);
c7ef3a90 468 return id;
50307a45 469 }
c7ef3a90
SR
470
471 return id;
a1301da0
LJ
472}
473
6f86ab9f
VN
474struct trace_event_functions enter_syscall_print_funcs = {
475 .trace = print_syscall_enter,
476};
477
478struct trace_event_functions exit_syscall_print_funcs = {
479 .trace = print_syscall_exit,
480};
481
523c8113 482struct ftrace_event_class __refdata event_class_syscall_enter = {
6f86ab9f
VN
483 .system = "syscalls",
484 .reg = syscall_enter_register,
485 .define_fields = syscall_enter_define_fields,
486 .get_fields = syscall_get_enter_fields,
487 .raw_init = init_syscall_trace,
488};
489
523c8113 490struct ftrace_event_class __refdata event_class_syscall_exit = {
6f86ab9f
VN
491 .system = "syscalls",
492 .reg = syscall_exit_register,
493 .define_fields = syscall_exit_define_fields,
494 .fields = LIST_HEAD_INIT(event_class_syscall_exit.fields),
495 .raw_init = init_syscall_trace,
496};
497
c763ba06 498unsigned long __init __weak arch_syscall_addr(int nr)
e7b8e675
MF
499{
500 return (unsigned long)sys_call_table[nr];
501}
502
6aea49cb 503static int __init init_ftrace_syscalls(void)
c44fc770
FW
504{
505 struct syscall_metadata *meta;
506 unsigned long addr;
507 int i;
508
47b0edcb
TM
509 syscalls_metadata = kcalloc(NR_syscalls, sizeof(*syscalls_metadata),
510 GFP_KERNEL);
c44fc770
FW
511 if (!syscalls_metadata) {
512 WARN_ON(1);
513 return -ENOMEM;
514 }
515
516 for (i = 0; i < NR_syscalls; i++) {
517 addr = arch_syscall_addr(i);
518 meta = find_syscall_meta(addr);
c252f657
LJ
519 if (!meta)
520 continue;
521
522 meta->syscall_nr = i;
c44fc770
FW
523 syscalls_metadata[i] = meta;
524 }
525
526 return 0;
527}
8781915a 528early_initcall(init_ftrace_syscalls);
c44fc770 529
07b139c8 530#ifdef CONFIG_PERF_EVENTS
19007a67 531
97d5a220
FW
532static DECLARE_BITMAP(enabled_perf_enter_syscalls, NR_syscalls);
533static DECLARE_BITMAP(enabled_perf_exit_syscalls, NR_syscalls);
534static int sys_perf_refcount_enter;
535static int sys_perf_refcount_exit;
f4b5ffcc 536
38516ab5 537static void perf_syscall_enter(void *ignore, struct pt_regs *regs, long id)
f4b5ffcc
JB
538{
539 struct syscall_metadata *sys_data;
20ab4425 540 struct syscall_trace_enter *rec;
1c024eca 541 struct hlist_head *head;
f4b5ffcc 542 int syscall_nr;
4ed7c92d 543 int rctx;
19007a67 544 int size;
f4b5ffcc 545
f431b634 546 syscall_nr = trace_get_syscall_nr(current, regs);
60916a93
WD
547 if (syscall_nr < 0)
548 return;
97d5a220 549 if (!test_bit(syscall_nr, enabled_perf_enter_syscalls))
f4b5ffcc
JB
550 return;
551
552 sys_data = syscall_nr_to_meta(syscall_nr);
553 if (!sys_data)
554 return;
555
19007a67
FW
556 /* get the size after alignment with the u32 buffer size field */
557 size = sizeof(unsigned long) * sys_data->nb_args + sizeof(*rec);
558 size = ALIGN(size + sizeof(u32), sizeof(u64));
559 size -= sizeof(u32);
560
97d5a220
FW
561 if (WARN_ONCE(size > PERF_MAX_TRACE_SIZE,
562 "perf buffer not large enough"))
20ab4425
FW
563 return;
564
97d5a220 565 rec = (struct syscall_trace_enter *)perf_trace_buf_prepare(size,
ff5f149b 566 sys_data->enter_event->event.type, regs, &rctx);
430ad5a6
XG
567 if (!rec)
568 return;
20ab4425 569
20ab4425
FW
570 rec->nr = syscall_nr;
571 syscall_get_arguments(current, regs, 0, sys_data->nb_args,
572 (unsigned long *)&rec->args);
1c024eca 573
3771f077 574 head = this_cpu_ptr(sys_data->enter_event->perf_events);
e6dab5ff 575 perf_trace_buf_submit(rec, size, rctx, 0, 1, regs, head, NULL);
f4b5ffcc
JB
576}
577
6f86ab9f 578static int perf_sysenter_enable(struct ftrace_event_call *call)
f4b5ffcc
JB
579{
580 int ret = 0;
581 int num;
582
3bbe84e9 583 num = ((struct syscall_metadata *)call->data)->syscall_nr;
f4b5ffcc
JB
584
585 mutex_lock(&syscall_trace_lock);
97d5a220 586 if (!sys_perf_refcount_enter)
38516ab5 587 ret = register_trace_sys_enter(perf_syscall_enter, NULL);
f4b5ffcc
JB
588 if (ret) {
589 pr_info("event trace: Could not activate"
590 "syscall entry trace point");
591 } else {
97d5a220
FW
592 set_bit(num, enabled_perf_enter_syscalls);
593 sys_perf_refcount_enter++;
f4b5ffcc
JB
594 }
595 mutex_unlock(&syscall_trace_lock);
596 return ret;
597}
598
6f86ab9f 599static void perf_sysenter_disable(struct ftrace_event_call *call)
f4b5ffcc
JB
600{
601 int num;
602
3bbe84e9 603 num = ((struct syscall_metadata *)call->data)->syscall_nr;
f4b5ffcc
JB
604
605 mutex_lock(&syscall_trace_lock);
97d5a220
FW
606 sys_perf_refcount_enter--;
607 clear_bit(num, enabled_perf_enter_syscalls);
608 if (!sys_perf_refcount_enter)
38516ab5 609 unregister_trace_sys_enter(perf_syscall_enter, NULL);
f4b5ffcc
JB
610 mutex_unlock(&syscall_trace_lock);
611}
612
38516ab5 613static void perf_syscall_exit(void *ignore, struct pt_regs *regs, long ret)
f4b5ffcc
JB
614{
615 struct syscall_metadata *sys_data;
20ab4425 616 struct syscall_trace_exit *rec;
1c024eca 617 struct hlist_head *head;
f4b5ffcc 618 int syscall_nr;
4ed7c92d 619 int rctx;
20ab4425 620 int size;
f4b5ffcc 621
f431b634 622 syscall_nr = trace_get_syscall_nr(current, regs);
60916a93
WD
623 if (syscall_nr < 0)
624 return;
97d5a220 625 if (!test_bit(syscall_nr, enabled_perf_exit_syscalls))
f4b5ffcc
JB
626 return;
627
628 sys_data = syscall_nr_to_meta(syscall_nr);
629 if (!sys_data)
630 return;
631
20ab4425
FW
632 /* We can probably do that at build time */
633 size = ALIGN(sizeof(*rec) + sizeof(u32), sizeof(u64));
634 size -= sizeof(u32);
19007a67 635
20ab4425
FW
636 /*
637 * Impossible, but be paranoid with the future
638 * How to put this check outside runtime?
639 */
97d5a220
FW
640 if (WARN_ONCE(size > PERF_MAX_TRACE_SIZE,
641 "exit event has grown above perf buffer size"))
20ab4425
FW
642 return;
643
97d5a220 644 rec = (struct syscall_trace_exit *)perf_trace_buf_prepare(size,
ff5f149b 645 sys_data->exit_event->event.type, regs, &rctx);
430ad5a6
XG
646 if (!rec)
647 return;
20ab4425 648
20ab4425
FW
649 rec->nr = syscall_nr;
650 rec->ret = syscall_get_return_value(current, regs);
651
3771f077 652 head = this_cpu_ptr(sys_data->exit_event->perf_events);
e6dab5ff 653 perf_trace_buf_submit(rec, size, rctx, 0, 1, regs, head, NULL);
f4b5ffcc
JB
654}
655
6f86ab9f 656static int perf_sysexit_enable(struct ftrace_event_call *call)
f4b5ffcc
JB
657{
658 int ret = 0;
659 int num;
660
3bbe84e9 661 num = ((struct syscall_metadata *)call->data)->syscall_nr;
f4b5ffcc
JB
662
663 mutex_lock(&syscall_trace_lock);
97d5a220 664 if (!sys_perf_refcount_exit)
38516ab5 665 ret = register_trace_sys_exit(perf_syscall_exit, NULL);
f4b5ffcc
JB
666 if (ret) {
667 pr_info("event trace: Could not activate"
6574658b 668 "syscall exit trace point");
f4b5ffcc 669 } else {
97d5a220
FW
670 set_bit(num, enabled_perf_exit_syscalls);
671 sys_perf_refcount_exit++;
f4b5ffcc
JB
672 }
673 mutex_unlock(&syscall_trace_lock);
674 return ret;
675}
676
6f86ab9f 677static void perf_sysexit_disable(struct ftrace_event_call *call)
f4b5ffcc
JB
678{
679 int num;
680
3bbe84e9 681 num = ((struct syscall_metadata *)call->data)->syscall_nr;
f4b5ffcc
JB
682
683 mutex_lock(&syscall_trace_lock);
97d5a220
FW
684 sys_perf_refcount_exit--;
685 clear_bit(num, enabled_perf_exit_syscalls);
686 if (!sys_perf_refcount_exit)
38516ab5 687 unregister_trace_sys_exit(perf_syscall_exit, NULL);
f4b5ffcc
JB
688 mutex_unlock(&syscall_trace_lock);
689}
690
07b139c8 691#endif /* CONFIG_PERF_EVENTS */
f4b5ffcc 692
2239291a 693static int syscall_enter_register(struct ftrace_event_call *event,
ceec0b6f 694 enum trace_reg type, void *data)
2239291a 695{
12ab74ee
SR
696 struct ftrace_event_file *file = data;
697
2239291a
SR
698 switch (type) {
699 case TRACE_REG_REGISTER:
12ab74ee 700 return reg_event_syscall_enter(file, event);
2239291a 701 case TRACE_REG_UNREGISTER:
12ab74ee 702 unreg_event_syscall_enter(file, event);
2239291a
SR
703 return 0;
704
705#ifdef CONFIG_PERF_EVENTS
706 case TRACE_REG_PERF_REGISTER:
707 return perf_sysenter_enable(event);
708 case TRACE_REG_PERF_UNREGISTER:
709 perf_sysenter_disable(event);
710 return 0;
ceec0b6f
JO
711 case TRACE_REG_PERF_OPEN:
712 case TRACE_REG_PERF_CLOSE:
489c75c3
JO
713 case TRACE_REG_PERF_ADD:
714 case TRACE_REG_PERF_DEL:
ceec0b6f 715 return 0;
2239291a
SR
716#endif
717 }
718 return 0;
719}
720
721static int syscall_exit_register(struct ftrace_event_call *event,
ceec0b6f 722 enum trace_reg type, void *data)
2239291a 723{
12ab74ee
SR
724 struct ftrace_event_file *file = data;
725
2239291a
SR
726 switch (type) {
727 case TRACE_REG_REGISTER:
12ab74ee 728 return reg_event_syscall_exit(file, event);
2239291a 729 case TRACE_REG_UNREGISTER:
12ab74ee 730 unreg_event_syscall_exit(file, event);
2239291a
SR
731 return 0;
732
733#ifdef CONFIG_PERF_EVENTS
734 case TRACE_REG_PERF_REGISTER:
735 return perf_sysexit_enable(event);
736 case TRACE_REG_PERF_UNREGISTER:
737 perf_sysexit_disable(event);
738 return 0;
ceec0b6f
JO
739 case TRACE_REG_PERF_OPEN:
740 case TRACE_REG_PERF_CLOSE:
489c75c3
JO
741 case TRACE_REG_PERF_ADD:
742 case TRACE_REG_PERF_DEL:
ceec0b6f 743 return 0;
2239291a
SR
744#endif
745 }
746 return 0;
747}