| /*-*- Mode: C; c-basic-offset: 8; indent-tabs-mode: nil -*-*/ |
| |
| /*** |
| This file is part of systemd. |
| |
| Copyright (C) 2009-2013 Intel Corporation |
| |
| Authors: |
| Auke Kok <auke-jan.h.kok@intel.com> |
| |
| systemd is free software; you can redistribute it and/or modify it |
| under the terms of the GNU Lesser General Public License as published by |
| the Free Software Foundation; either version 2.1 of the License, or |
| (at your option) any later version. |
| |
| systemd is distributed in the hope that it will be useful, but |
| WITHOUT ANY WARRANTY; without even the implied warranty of |
| MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| Lesser General Public License for more details. |
| |
| You should have received a copy of the GNU Lesser General Public License |
| along with systemd; If not, see <http://www.gnu.org/licenses/>. |
| ***/ |
| |
| /*** |
| |
| Many thanks to those who contributed ideas and code: |
| - Ziga Mahkovec - Original bootchart author |
| - Anders Norgaard - PyBootchartgui |
| - Michael Meeks - bootchart2 |
| - Scott James Remnant - Ubuntu C-based logger |
| - Arjan van der Ven - for the idea to merge bootgraph.pl functionality |
| |
| ***/ |
| |
| #include <errno.h> |
| #include <fcntl.h> |
| #include <getopt.h> |
| #include <limits.h> |
| #include <signal.h> |
| #include <stdbool.h> |
| #include <stdio.h> |
| #include <stdlib.h> |
| #include <string.h> |
| #include <sys/resource.h> |
| #include <time.h> |
| #include <unistd.h> |
| |
| #include "sd-journal.h" |
| |
| #include "alloc-util.h" |
| #include "bootchart.h" |
| #include "conf-parser.h" |
| #include "def.h" |
| #include "fd-util.h" |
| #include "fileio.h" |
| #include "io-util.h" |
| #include "list.h" |
| #include "macro.h" |
| #include "parse-util.h" |
| #include "path-util.h" |
| #include "store.h" |
| #include "string-util.h" |
| #include "strxcpyx.h" |
| #include "svg.h" |
| #include "util.h" |
| |
| static int exiting = 0; |
| |
| #define DEFAULT_SAMPLES_LEN 500 |
| #define DEFAULT_HZ 25.0 |
| #define DEFAULT_SCALE_X 100.0 /* 100px = 1sec */ |
| #define DEFAULT_SCALE_Y 20.0 /* 16px = 1 process bar */ |
| #define DEFAULT_INIT ROOTLIBEXECDIR "/systemd" |
| #define DEFAULT_OUTPUT "/run/log" |
| |
| /* graph defaults */ |
| bool arg_entropy = false; |
| bool arg_initcall = true; |
| bool arg_relative = false; |
| bool arg_filter = true; |
| bool arg_show_cmdline = false; |
| bool arg_show_cgroup = false; |
| bool arg_pss = false; |
| bool arg_percpu = false; |
| int arg_samples_len = DEFAULT_SAMPLES_LEN; /* we record len+1 (1 start sample) */ |
| double arg_hz = DEFAULT_HZ; |
| double arg_scale_x = DEFAULT_SCALE_X; |
| double arg_scale_y = DEFAULT_SCALE_Y; |
| |
| char arg_init_path[PATH_MAX] = DEFAULT_INIT; |
| char arg_output_path[PATH_MAX] = DEFAULT_OUTPUT; |
| |
| static void signal_handler(int sig) { |
| exiting = 1; |
| } |
| |
| #define BOOTCHART_MAX (16*1024*1024) |
| |
| static void parse_conf(void) { |
| char *init = NULL, *output = NULL; |
| const ConfigTableItem items[] = { |
| { "Bootchart", "Samples", config_parse_int, 0, &arg_samples_len }, |
| { "Bootchart", "Frequency", config_parse_double, 0, &arg_hz }, |
| { "Bootchart", "Relative", config_parse_bool, 0, &arg_relative }, |
| { "Bootchart", "Filter", config_parse_bool, 0, &arg_filter }, |
| { "Bootchart", "Output", config_parse_path, 0, &output }, |
| { "Bootchart", "Init", config_parse_path, 0, &init }, |
| { "Bootchart", "PlotMemoryUsage", config_parse_bool, 0, &arg_pss }, |
| { "Bootchart", "PlotEntropyGraph", config_parse_bool, 0, &arg_entropy }, |
| { "Bootchart", "ScaleX", config_parse_double, 0, &arg_scale_x }, |
| { "Bootchart", "ScaleY", config_parse_double, 0, &arg_scale_y }, |
| { "Bootchart", "ControlGroup", config_parse_bool, 0, &arg_show_cgroup }, |
| { "Bootchart", "PerCPU", config_parse_bool, 0, &arg_percpu }, |
| { NULL, NULL, NULL, 0, NULL } |
| }; |
| |
| config_parse_many(PKGSYSCONFDIR "/bootchart.conf", |
| CONF_PATHS_NULSTR("systemd/bootchart.conf.d"), |
| NULL, config_item_table_lookup, items, true, NULL); |
| |
| if (init != NULL) |
| strscpy(arg_init_path, sizeof(arg_init_path), init); |
| if (output != NULL) |
| strscpy(arg_output_path, sizeof(arg_output_path), output); |
| } |
| |
| static void help(void) { |
| printf("Usage: %s [OPTIONS]\n\n" |
| "Options:\n" |
| " -r --rel Record time relative to recording\n" |
| " -f --freq=FREQ Sample frequency [%g]\n" |
| " -n --samples=N Stop sampling at [%d] samples\n" |
| " -x --scale-x=N Scale the graph horizontally [%g] \n" |
| " -y --scale-y=N Scale the graph vertically [%g] \n" |
| " -p --pss Enable PSS graph (CPU intensive)\n" |
| " -e --entropy Enable the entropy_avail graph\n" |
| " -o --output=PATH Path to output files [%s]\n" |
| " -i --init=PATH Path to init executable [%s]\n" |
| " -F --no-filter Disable filtering of unimportant or ephemeral processes\n" |
| " -C --cmdline Display full command lines with arguments\n" |
| " -c --control-group Display process control group\n" |
| " --per-cpu Draw each CPU utilization and wait bar also\n" |
| " -h --help Display this message\n\n" |
| "See bootchart.conf for more information.\n", |
| program_invocation_short_name, |
| DEFAULT_HZ, |
| DEFAULT_SAMPLES_LEN, |
| DEFAULT_SCALE_X, |
| DEFAULT_SCALE_Y, |
| DEFAULT_OUTPUT, |
| DEFAULT_INIT); |
| } |
| |
| static int parse_argv(int argc, char *argv[]) { |
| |
| enum { |
| ARG_PERCPU = 0x100, |
| }; |
| |
| static const struct option options[] = { |
| {"rel", no_argument, NULL, 'r' }, |
| {"freq", required_argument, NULL, 'f' }, |
| {"samples", required_argument, NULL, 'n' }, |
| {"pss", no_argument, NULL, 'p' }, |
| {"output", required_argument, NULL, 'o' }, |
| {"init", required_argument, NULL, 'i' }, |
| {"no-filter", no_argument, NULL, 'F' }, |
| {"cmdline", no_argument, NULL, 'C' }, |
| {"control-group", no_argument, NULL, 'c' }, |
| {"help", no_argument, NULL, 'h' }, |
| {"scale-x", required_argument, NULL, 'x' }, |
| {"scale-y", required_argument, NULL, 'y' }, |
| {"entropy", no_argument, NULL, 'e' }, |
| {"per-cpu", no_argument, NULL, ARG_PERCPU}, |
| {} |
| }; |
| int c, r; |
| |
| if (getpid() == 1) |
| opterr = 0; |
| |
| while ((c = getopt_long(argc, argv, "erpf:n:o:i:FCchx:y:", options, NULL)) >= 0) |
| switch (c) { |
| |
| case 'r': |
| arg_relative = true; |
| break; |
| case 'f': |
| r = safe_atod(optarg, &arg_hz); |
| if (r < 0) |
| log_warning_errno(r, "failed to parse --freq/-f argument '%s': %m", |
| optarg); |
| break; |
| case 'F': |
| arg_filter = false; |
| break; |
| case 'C': |
| arg_show_cmdline = true; |
| break; |
| case 'c': |
| arg_show_cgroup = true; |
| break; |
| case 'n': |
| r = safe_atoi(optarg, &arg_samples_len); |
| if (r < 0) |
| log_warning_errno(r, "failed to parse --samples/-n argument '%s': %m", |
| optarg); |
| break; |
| case 'o': |
| path_kill_slashes(optarg); |
| strscpy(arg_output_path, sizeof(arg_output_path), optarg); |
| break; |
| case 'i': |
| path_kill_slashes(optarg); |
| strscpy(arg_init_path, sizeof(arg_init_path), optarg); |
| break; |
| case 'p': |
| arg_pss = true; |
| break; |
| case 'x': |
| r = safe_atod(optarg, &arg_scale_x); |
| if (r < 0) |
| log_warning_errno(r, "failed to parse --scale-x/-x argument '%s': %m", |
| optarg); |
| break; |
| case 'y': |
| r = safe_atod(optarg, &arg_scale_y); |
| if (r < 0) |
| log_warning_errno(r, "failed to parse --scale-y/-y argument '%s': %m", |
| optarg); |
| break; |
| case 'e': |
| arg_entropy = true; |
| break; |
| case ARG_PERCPU: |
| arg_percpu = true; |
| break; |
| case 'h': |
| help(); |
| return 0; |
| case '?': |
| if (getpid() != 1) |
| return -EINVAL; |
| else |
| return 0; |
| default: |
| assert_not_reached("Unhandled option code."); |
| } |
| |
| if (arg_hz <= 0) { |
| log_error("Frequency needs to be > 0"); |
| return -EINVAL; |
| } |
| |
| return 1; |
| } |
| |
| static int do_journal_append(char *file) { |
| _cleanup_free_ char *bootchart_message = NULL; |
| _cleanup_free_ char *bootchart_file = NULL; |
| _cleanup_free_ char *p = NULL; |
| _cleanup_close_ int fd = -1; |
| struct iovec iovec[5]; |
| int r, j = 0; |
| ssize_t n; |
| |
| bootchart_file = strappend("BOOTCHART_FILE=", file); |
| if (!bootchart_file) |
| return log_oom(); |
| |
| IOVEC_SET_STRING(iovec[j++], bootchart_file); |
| IOVEC_SET_STRING(iovec[j++], "MESSAGE_ID=9f26aa562cf440c2b16c773d0479b518"); |
| IOVEC_SET_STRING(iovec[j++], "PRIORITY=7"); |
| bootchart_message = strjoin("MESSAGE=Bootchart created: ", file, NULL); |
| if (!bootchart_message) |
| return log_oom(); |
| |
| IOVEC_SET_STRING(iovec[j++], bootchart_message); |
| |
| p = malloc(10 + BOOTCHART_MAX); |
| if (!p) |
| return log_oom(); |
| |
| memcpy(p, "BOOTCHART=", 10); |
| |
| fd = open(file, O_RDONLY|O_CLOEXEC); |
| if (fd < 0) |
| return log_error_errno(errno, "Failed to open bootchart data \"%s\": %m", file); |
| |
| n = loop_read(fd, p + 10, BOOTCHART_MAX, false); |
| if (n < 0) |
| return log_error_errno(n, "Failed to read bootchart data: %m"); |
| |
| iovec[j].iov_base = p; |
| iovec[j].iov_len = 10 + n; |
| j++; |
| |
| r = sd_journal_sendv(iovec, j); |
| if (r < 0) |
| log_error_errno(r, "Failed to send bootchart: %m"); |
| |
| return 0; |
| } |
| |
| int main(int argc, char *argv[]) { |
| static struct list_sample_data *sampledata; |
| _cleanup_closedir_ DIR *proc = NULL; |
| _cleanup_free_ char *build = NULL; |
| _cleanup_fclose_ FILE *of = NULL; |
| _cleanup_close_ int sysfd = -1; |
| struct ps_struct *ps_first; |
| double graph_start; |
| double log_start; |
| double interval; |
| char output_file[PATH_MAX]; |
| char datestr[200]; |
| int pscount = 0; |
| int n_cpus = 0; |
| int overrun = 0; |
| time_t t = 0; |
| int r, samples; |
| struct ps_struct *ps; |
| struct rlimit rlim; |
| struct list_sample_data *head; |
| struct sigaction sig = { |
| .sa_handler = signal_handler, |
| }; |
| |
| parse_conf(); |
| |
| r = parse_argv(argc, argv); |
| if (r < 0) |
| return EXIT_FAILURE; |
| |
| if (r == 0) |
| return EXIT_SUCCESS; |
| |
| /* |
| * If the kernel executed us through init=/usr/lib/systemd/systemd-bootchart, then |
| * fork: |
| * - parent execs executable specified via init_path[] (/usr/lib/systemd/systemd by default) as pid=1 |
| * - child logs data |
| */ |
| if (getpid() == 1) { |
| if (fork()) |
| /* parent */ |
| execl(arg_init_path, arg_init_path, NULL); |
| } |
| argv[0][0] = '@'; |
| |
| rlim.rlim_cur = 4096; |
| rlim.rlim_max = 4096; |
| (void) setrlimit(RLIMIT_NOFILE, &rlim); |
| |
| /* start with empty ps LL */ |
| ps_first = new0(struct ps_struct, 1); |
| if (!ps_first) { |
| log_oom(); |
| return EXIT_FAILURE; |
| } |
| |
| /* handle TERM/INT nicely */ |
| sigaction(SIGHUP, &sig, NULL); |
| |
| interval = (1.0 / arg_hz) * 1000000000.0; |
| |
| if (arg_relative) |
| graph_start = log_start = gettime_ns(); |
| else { |
| struct timespec n; |
| double uptime; |
| |
| clock_gettime(clock_boottime_or_monotonic(), &n); |
| uptime = (n.tv_sec + (n.tv_nsec / (double) NSEC_PER_SEC)); |
| |
| log_start = gettime_ns(); |
| graph_start = log_start - uptime; |
| } |
| |
| if (graph_start < 0.0) { |
| log_error("Failed to setup graph start time.\n\n" |
| "The system uptime probably includes time that the system was suspended. " |
| "Use --rel to bypass this issue."); |
| return EXIT_FAILURE; |
| } |
| |
| LIST_HEAD_INIT(head); |
| |
| /* main program loop */ |
| for (samples = 0; !exiting && samples < arg_samples_len; samples++) { |
| int res; |
| double sample_stop; |
| double elapsed; |
| double timeleft; |
| |
| sampledata = new0(struct list_sample_data, 1); |
| if (sampledata == NULL) { |
| log_oom(); |
| return EXIT_FAILURE; |
| } |
| |
| sampledata->sampletime = gettime_ns(); |
| sampledata->counter = samples; |
| |
| if (sysfd < 0) |
| sysfd = open("/sys", O_RDONLY|O_CLOEXEC); |
| |
| if (!build) { |
| if (parse_env_file("/etc/os-release", NEWLINE, "PRETTY_NAME", &build, NULL) == -ENOENT) |
| parse_env_file("/usr/lib/os-release", NEWLINE, "PRETTY_NAME", &build, NULL); |
| } |
| |
| if (proc) |
| rewinddir(proc); |
| else |
| proc = opendir("/proc"); |
| |
| /* wait for /proc to become available, discarding samples */ |
| if (proc) { |
| r = log_sample(proc, samples, ps_first, &sampledata, &pscount, &n_cpus); |
| if (r < 0) |
| return EXIT_FAILURE; |
| } |
| |
| sample_stop = gettime_ns(); |
| |
| elapsed = (sample_stop - sampledata->sampletime) * 1000000000.0; |
| timeleft = interval - elapsed; |
| |
| /* |
| * check if we have not consumed our entire timeslice. If we |
| * do, don't sleep and take a new sample right away. |
| * we'll lose all the missed samples and overrun our total |
| * time |
| */ |
| if (timeleft > 0) { |
| struct timespec req; |
| |
| req.tv_sec = (time_t)(timeleft / 1000000000.0); |
| req.tv_nsec = (long)(timeleft - (req.tv_sec * 1000000000.0)); |
| |
| res = nanosleep(&req, NULL); |
| if (res) { |
| if (errno == EINTR) |
| /* caught signal, probably HUP! */ |
| break; |
| log_error_errno(errno, "nanosleep() failed: %m"); |
| return EXIT_FAILURE; |
| } |
| } else { |
| overrun++; |
| /* calculate how many samples we lost and scrap them */ |
| arg_samples_len -= (int)(-timeleft / interval); |
| } |
| LIST_PREPEND(link, head, sampledata); |
| } |
| |
| /* do some cleanup, close fd's */ |
| ps = ps_first; |
| while (ps->next_ps) { |
| ps = ps->next_ps; |
| ps->schedstat = safe_close(ps->schedstat); |
| ps->sched = safe_close(ps->sched); |
| ps->smaps = safe_fclose(ps->smaps); |
| } |
| |
| if (!of) { |
| t = time(NULL); |
| r = strftime(datestr, sizeof(datestr), "%Y%m%d-%H%M", localtime(&t)); |
| assert_se(r > 0); |
| |
| snprintf(output_file, PATH_MAX, "%s/bootchart-%s.svg", arg_output_path, datestr); |
| of = fopen(output_file, "we"); |
| } |
| |
| if (!of) { |
| log_error("Error opening output file '%s': %m\n", output_file); |
| return EXIT_FAILURE; |
| } |
| |
| r = svg_do(of, strna(build), head, ps_first, |
| samples, pscount, n_cpus, graph_start, |
| log_start, interval, overrun); |
| |
| if (r < 0) { |
| log_error_errno(r, "Error generating svg file: %m"); |
| return EXIT_FAILURE; |
| } |
| |
| log_info("systemd-bootchart wrote %s\n", output_file); |
| |
| r = do_journal_append(output_file); |
| if (r < 0) |
| return EXIT_FAILURE; |
| |
| /* nitpic cleanups */ |
| ps = ps_first->next_ps; |
| while (ps->next_ps) { |
| struct ps_struct *old; |
| |
| old = ps; |
| old->sample = ps->first; |
| ps = ps->next_ps; |
| while (old->sample->next) { |
| struct ps_sched_struct *oldsample = old->sample; |
| |
| old->sample = old->sample->next; |
| free(oldsample); |
| } |
| free(old->cgroup); |
| free(old->sample); |
| free(old); |
| } |
| |
| free(ps->cgroup); |
| free(ps->sample); |
| free(ps); |
| |
| sampledata = head; |
| while (sampledata->link_prev) { |
| struct list_sample_data *old_sampledata = sampledata; |
| sampledata = sampledata->link_prev; |
| free(old_sampledata); |
| } |
| free(sampledata); |
| |
| /* don't complain when overrun once, happens most commonly on 1st sample */ |
| if (overrun > 1) |
| log_warning("systemd-bootchart: sample time overrun %i times\n", overrun); |
| |
| return 0; |
| } |