Skip to content

Commit cd26ea6

Browse files
committed
perf trace: Fix setting of augmented payload when using eBPF + raw_syscalls
For now with BPF raw_augmented we hook into raw_syscalls:sys_enter and there we get all 6 syscall args plus the tracepoint common fields (sizeof(long)) and the syscall_nr (another long). So we check if that is the case and if so don't look after the sc->args_size, but always after the full raw_syscalls:sys_enter payload, which is fixed. We'll revisit this later to pass s->args_size to the BPF augmenter (now tools/perf/examples/bpf/augmented_raw_syscalls.c, so that it copies only what we need for each syscall, like what happens when we use syscalls:sys_enter_NAME, so that we reduce the kernel/userspace traffic to just what is needed for each syscall. Cc: Adrian Hunter <adrian.hunter@intel.com> Cc: David Ahern <dsahern@gmail.com> Cc: Jiri Olsa <jolsa@kernel.org> Cc: Namhyung Kim <namhyung@kernel.org> Cc: Wang Nan <wangnan0@huawei.com> Link: https://lkml.kernel.org/n/tip-nlslrg8apxdsobt4pwl3n7ur@git.kernel.org Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
1 parent 3c5e3da commit cd26ea6

File tree

1 file changed

+30
-7
lines changed

1 file changed

+30
-7
lines changed

tools/perf/builtin-trace.c

Lines changed: 30 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -108,6 +108,7 @@ struct trace {
108108
} stats;
109109
unsigned int max_stack;
110110
unsigned int min_stack;
111+
bool raw_augmented_syscalls;
111112
bool not_ev_qualifier;
112113
bool live;
113114
bool full_time;
@@ -1724,13 +1725,28 @@ static int trace__fprintf_sample(struct trace *trace, struct perf_evsel *evsel,
17241725
return printed;
17251726
}
17261727

1727-
static void *syscall__augmented_args(struct syscall *sc, struct perf_sample *sample, int *augmented_args_size)
1728+
static void *syscall__augmented_args(struct syscall *sc, struct perf_sample *sample, int *augmented_args_size, bool raw_augmented)
17281729
{
17291730
void *augmented_args = NULL;
1731+
/*
1732+
* For now with BPF raw_augmented we hook into raw_syscalls:sys_enter
1733+
* and there we get all 6 syscall args plus the tracepoint common
1734+
* fields (sizeof(long)) and the syscall_nr (another long). So we check
1735+
* if that is the case and if so don't look after the sc->args_size,
1736+
* but always after the full raw_syscalls:sys_enter payload, which is
1737+
* fixed.
1738+
*
1739+
* We'll revisit this later to pass s->args_size to the BPF augmenter
1740+
* (now tools/perf/examples/bpf/augmented_raw_syscalls.c, so that it
1741+
* copies only what we need for each syscall, like what happens when we
1742+
* use syscalls:sys_enter_NAME, so that we reduce the kernel/userspace
1743+
* traffic to just what is needed for each syscall.
1744+
*/
1745+
int args_size = raw_augmented ? (8 * (int)sizeof(long)) : sc->args_size;
17301746

1731-
*augmented_args_size = sample->raw_size - sc->args_size;
1747+
*augmented_args_size = sample->raw_size - args_size;
17321748
if (*augmented_args_size > 0)
1733-
augmented_args = sample->raw_data + sc->args_size;
1749+
augmented_args = sample->raw_data + args_size;
17341750

17351751
return augmented_args;
17361752
}
@@ -1780,7 +1796,7 @@ static int trace__sys_enter(struct trace *trace, struct perf_evsel *evsel,
17801796
* here and avoid using augmented syscalls when the evsel is the raw_syscalls one.
17811797
*/
17821798
if (evsel != trace->syscalls.events.sys_enter)
1783-
augmented_args = syscall__augmented_args(sc, sample, &augmented_args_size);
1799+
augmented_args = syscall__augmented_args(sc, sample, &augmented_args_size, trace->raw_augmented_syscalls);
17841800
ttrace->entry_time = sample->time;
17851801
msg = ttrace->entry_str;
17861802
printed += scnprintf(msg + printed, trace__entry_str_size - printed, "%s(", sc->name);
@@ -1833,7 +1849,7 @@ static int trace__fprintf_sys_enter(struct trace *trace, struct perf_evsel *evse
18331849
goto out_put;
18341850

18351851
args = perf_evsel__sc_tp_ptr(evsel, args, sample);
1836-
augmented_args = syscall__augmented_args(sc, sample, &augmented_args_size);
1852+
augmented_args = syscall__augmented_args(sc, sample, &augmented_args_size, trace->raw_augmented_syscalls);
18371853
syscall__scnprintf_args(sc, msg, sizeof(msg), args, augmented_args, augmented_args_size, trace, thread);
18381854
fprintf(trace->output, "%s", msg);
18391855
err = 0;
@@ -3501,8 +3517,15 @@ int cmd_trace(int argc, const char **argv)
35013517
evsel->handler = trace__sys_enter;
35023518

35033519
evlist__for_each_entry(trace.evlist, evsel) {
3504-
if (strstarts(perf_evsel__name(evsel), "syscalls:sys_exit_") ||
3505-
strcmp(perf_evsel__name(evsel), "raw_syscalls:sys_exit") == 0) {
3520+
bool raw_syscalls_sys_exit = strcmp(perf_evsel__name(evsel), "raw_syscalls:sys_exit") == 0;
3521+
3522+
if (raw_syscalls_sys_exit) {
3523+
trace.raw_augmented_syscalls = true;
3524+
goto init_augmented_syscall_tp;
3525+
}
3526+
3527+
if (strstarts(perf_evsel__name(evsel), "syscalls:sys_exit_")) {
3528+
init_augmented_syscall_tp:
35063529
perf_evsel__init_augmented_syscall_tp(evsel);
35073530
perf_evsel__init_augmented_syscall_tp_ret(evsel);
35083531
evsel->handler = trace__sys_exit;

0 commit comments

Comments
 (0)