tracing: Add additional marks to signal very large time deltas

Currently, function graph tracer prints "!" or "+" just before
function execution time to signal a function overhead, depending
on the time. And some tracers tracing latency also print "!" or
"+" just after time to signal overhead, depending on the interval
between events. Even it is usually enough to do that, we sometimes
need to signal for bigger execution time than 100 micro seconds.

For example, I used function graph tracer to detect if there is
any case that exit_mm() takes too much time. I did following steps
in /sys/kernel/debug/tracing. It was easier to detect very large
excution time with patched kernel than with original kernel.

$ echo exit_mm > set_graph_function
$ echo function_graph > current_tracer
$ echo > trace
$ cat trace_pipe > $LOGFILE
 ... (do something and terminate logging)
$ grep "\\$" $LOGFILE
 3) $ 22082032 us |                      } /* kernel_map_pages */
 3) $ 22082040 us |                    } /* free_pages_prepare */
 3) $ 22082113 us |                  } /* free_hot_cold_page */
 3) $ 22083455 us |                } /* free_hot_cold_page_list */
 3) $ 22083895 us |              } /* release_pages */
 3) $ 22177873 us |            } /* free_pages_and_swap_cache */
 3) $ 22178929 us |          } /* unmap_single_vma */
 3) $ 22198885 us |        } /* unmap_vmas */
 3) $ 22206949 us |      } /* exit_mmap */
 3) $ 22207659 us |    } /* mmput */
 3) $ 22207793 us |  } /* exit_mm */

And then, it was easy to find out that a schedule-out occured by
sub_preempt_count() within kernel_map_pages().

To detect very large function exection time caused by either problematic
function implementation or scheduling issues, this patch can be useful.

Link: http://lkml.kernel.org/r/1416789259-24038-1-git-send-email-byungchul.park@lge.com

Signed-off-by: Byungchul Park <byungchul.park@lge.com>
Signed-off-by: Steven Rostedt <rostedt@goodmis.org>
This commit is contained in:
Byungchul Park 2014-11-24 09:34:19 +09:00 committed by Steven Rostedt
parent 3e6fb8e943
commit 8e1e1df29d
4 changed files with 41 additions and 28 deletions

View File

@ -685,9 +685,11 @@ The above is mostly meaningful for kernel developers.
needs to be fixed to be only relative to the same CPU. needs to be fixed to be only relative to the same CPU.
The marks are determined by the difference between this The marks are determined by the difference between this
current trace and the next trace. current trace and the next trace.
'!' - greater than preempt_mark_thresh (default 100) '$' - greater than 1 second
'+' - greater than 1 microsecond '#' - greater than 1000 microsecond
' ' - less than or equal to 1 microsecond. '!' - greater than 100 microsecond
'+' - greater than 10 microsecond
' ' - less than or equal to 10 microsecond.
The rest is the same as the 'trace' file. The rest is the same as the 'trace' file.
@ -1956,6 +1958,8 @@ want, depending on your needs.
+ means that the function exceeded 10 usecs. + means that the function exceeded 10 usecs.
! means that the function exceeded 100 usecs. ! means that the function exceeded 100 usecs.
# means that the function exceeded 1000 usecs.
$ means that the function exceeded 1 sec.
- The task/pid field displays the thread cmdline and pid which - The task/pid field displays the thread cmdline and pid which

View File

@ -708,6 +708,8 @@ enum print_line_t print_trace_line(struct trace_iterator *iter);
extern unsigned long trace_flags; extern unsigned long trace_flags;
extern char trace_find_mark(unsigned long long duration);
/* Standard output formatting function used for function return traces */ /* Standard output formatting function used for function return traces */
#ifdef CONFIG_FUNCTION_GRAPH_TRACER #ifdef CONFIG_FUNCTION_GRAPH_TRACER

View File

@ -730,8 +730,6 @@ static void
print_graph_duration(unsigned long long duration, struct trace_seq *s, print_graph_duration(unsigned long long duration, struct trace_seq *s,
u32 flags) u32 flags)
{ {
bool duration_printed = false;
if (!(flags & TRACE_GRAPH_PRINT_DURATION) || if (!(flags & TRACE_GRAPH_PRINT_DURATION) ||
!(trace_flags & TRACE_ITER_CONTEXT_INFO)) !(trace_flags & TRACE_ITER_CONTEXT_INFO))
return; return;
@ -750,24 +748,9 @@ print_graph_duration(unsigned long long duration, struct trace_seq *s,
} }
/* Signal a overhead of time execution to the output */ /* Signal a overhead of time execution to the output */
if (flags & TRACE_GRAPH_PRINT_OVERHEAD) { if (flags & TRACE_GRAPH_PRINT_OVERHEAD)
/* Duration exceeded 100 usecs */ trace_seq_printf(s, "%c ", trace_find_mark(duration));
if (duration > 100000ULL) { else
trace_seq_puts(s, "! ");
duration_printed = true;
/* Duration exceeded 10 usecs */
} else if (duration > 10000ULL) {
trace_seq_puts(s, "+ ");
duration_printed = true;
}
}
/*
* If we did not exceed the duration tresholds or we dont want
* to print out the overhead. Either way we need to fill out the space.
*/
if (!duration_printed)
trace_seq_puts(s, " "); trace_seq_puts(s, " ");
trace_print_graph_duration(duration, s); trace_print_graph_duration(duration, s);

View File

@ -115,7 +115,7 @@ ftrace_print_symbols_seq(struct trace_seq *p, unsigned long val,
if (ret == (const char *)(trace_seq_buffer_ptr(p))) if (ret == (const char *)(trace_seq_buffer_ptr(p)))
trace_seq_printf(p, "0x%lx", val); trace_seq_printf(p, "0x%lx", val);
trace_seq_putc(p, 0); trace_seq_putc(p, 0);
return ret; return ret;
@ -443,7 +443,32 @@ lat_print_generic(struct trace_seq *s, struct trace_entry *entry, int cpu)
return trace_print_lat_fmt(s, entry); return trace_print_lat_fmt(s, entry);
} }
static unsigned long preempt_mark_thresh_us = 100; #undef MARK
#define MARK(v, s) {.val = v, .sym = s}
/* trace overhead mark */
static const struct trace_mark {
unsigned long long val; /* unit: nsec */
char sym;
} mark[] = {
MARK(1000000000ULL , '$'), /* 1 sec */
MARK(1000000ULL , '#'), /* 1000 usecs */
MARK(100000ULL , '!'), /* 100 usecs */
MARK(10000ULL , '+'), /* 10 usecs */
};
#undef MARK
char trace_find_mark(unsigned long long d)
{
int i;
int size = ARRAY_SIZE(mark);
for (i = 0; i < size; i++) {
if (d >= mark[i].val)
break;
}
return (i == size) ? ' ' : mark[i].sym;
}
static int static int
lat_print_timestamp(struct trace_iterator *iter, u64 next_ts) lat_print_timestamp(struct trace_iterator *iter, u64 next_ts)
@ -480,8 +505,7 @@ lat_print_timestamp(struct trace_iterator *iter, u64 next_ts)
trace_seq_printf( trace_seq_printf(
s, " %4lldus%c: ", s, " %4lldus%c: ",
abs_ts, abs_ts,
rel_ts > preempt_mark_thresh_us ? '!' : trace_find_mark(rel_ts * NSEC_PER_USEC));
rel_ts > 1 ? '+' : ' ');
} else { /* !verbose && !in_ns */ } else { /* !verbose && !in_ns */
trace_seq_printf(s, " %4lld: ", abs_ts); trace_seq_printf(s, " %4lld: ", abs_ts);
@ -663,7 +687,7 @@ int register_ftrace_event(struct trace_event *event)
goto out; goto out;
} else { } else {
event->type = next_event_type++; event->type = next_event_type++;
list = &ftrace_event_list; list = &ftrace_event_list;
} }