From e4bc14b875434c3d5d044ee7b73db0211296f8f3 Mon Sep 17 00:00:00 2001 From: David Wilson Date: Thu, 22 Feb 2018 17:39:50 +0545 Subject: [PATCH] scripts: initial DTrace script. --- scripts/generate_cpu_series.py | 57 +++++++++++++++ scripts/profile_ansible.d | 129 +++++++++++++++++++++++++++++++++ 2 files changed, 186 insertions(+) create mode 100644 scripts/generate_cpu_series.py create mode 100755 scripts/profile_ansible.d diff --git a/scripts/generate_cpu_series.py b/scripts/generate_cpu_series.py new file mode 100644 index 00000000..60cc4764 --- /dev/null +++ b/scripts/generate_cpu_series.py @@ -0,0 +1,57 @@ +#!/usr/bin/env python +# Copyright 2017, David Wilson +# +# Redistribution and use in source and binary forms, with or without +# modification, are permitted provided that the following conditions are met: +# +# 1. Redistributions of source code must retain the above copyright notice, this +# list of conditions and the following disclaimer. +# +# 2. Redistributions in binary form must reproduce the above copyright notice, +# this list of conditions and the following disclaimer in the documentation +# and/or other materials provided with the distribution. +# +# 3. Neither the name of the copyright holder nor the names of its contributors +# may be used to endorse or promote products derived from this software without +# specific prior written permission. +# +# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND +# ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED +# WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE +# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR +# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, +# OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + +""" +Read a CSV produced by profile_ansible.d on stdin and produce a 100ms-precision +series of accumulated CPU time on stdout, with floating point second-resolution +timestamps relative to time of first event. +""" + +import collections +import csv +import sys + +nanosec = 1e9 +precision = 1 + +c = collections.Counter() +wall = 0 + +for row in csv.DictReader(sys.stdin): + n = float(row['wall_nsec']) / nanosec + if wall == 0: + wall = n + if row['op'] == 'SCHED': + c[round(n-wall, precision)] += int(row['cpu_nsec']) + +wr = csv.writer(sys.stdout) +wr.writerow(['wall', 'cpu']) +total = 0.0 +for wall, cpu in sorted(c.iteritems()): + total += cpu + wr.writerow((wall, total)) diff --git a/scripts/profile_ansible.d b/scripts/profile_ansible.d new file mode 100755 index 00000000..6973cc0d --- /dev/null +++ b/scripts/profile_ansible.d @@ -0,0 +1,129 @@ +#!/usr/sbin/dtrace -qs + +/* + * Copyright 2017, David Wilson + * + * Redistribution and use in source and binary forms, with or without + * modification, are permitted provided that the following conditions are met: + * + * 1. Redistributions of source code must retain the above copyright notice, this + * list of conditions and the following disclaimer. + * + * 2. Redistributions in binary form must reproduce the above copyright notice, + * this list of conditions and the following disclaimer in the documentation + * and/or other materials provided with the distribution. + * + * 3. Neither the name of the copyright holder nor the names of its contributors + * may be used to endorse or promote products derived from this software without + * specific prior written permission. + * + * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND + * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED + * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE + * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE + * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL + * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR + * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER + * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, + * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE + * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + */ + +/* + * OS X DTrace script to record the CPU time consumed by any python2.7 or SSH + * process, and the exact read/write sizes to any AF_INET socket opened by an + * SSH process. + * + * This introduces significant tracing overhead of between 5-10%, most likely + * due to the SCHED events. + * + * Produces a CSV file containing columns: + * - wall_nsec: Nanoseconds wall time. + * - op: One of START, SCHED, EXIT, READ, WRITE + * - nbytes: for READ/WRITE, size of AF_INET data read/written + * - cpu_nsec: for SCHED, nanoseconds spent scheduled. + * - pid: Process ID. + * - execname: argv[0] + * + * Operations: + * - START: thread relevant to the trace started up. + * - EXIT: thread relevant to the trace ended, cpu_nsec contains total + * time scheduled + * - SCHED: thread relevant to the trace was scheduled, cpu_nsec contains + * time spent before it went off-cpu again. + * - READ: SSH process performed a nbytes read from an AF_INET socket. + * - WRITE: SSH process performed a nbytes write to an AF_INET socket. + */ + +inline string SSH = "ssh"; +inline string PYTHON = "python2.7"; +inline int PF_INET = 2; + +dtrace:::BEGIN +{ + printf("wall_nsec,op,nbytes,cpu_nsec,pid,execname\n"); +} + +syscall::socket:entry +/execname == SSH && arg0 == PF_INET/ +{ + self->is_inet = 1; +} + +syscall::socket:return +/self->is_inet/ +{ + self->inet_fds[arg0] = 1; +} + +syscall::write*:entry +/self->inet_fds[arg0]/ +{ + self->write_fd = arg0; + self->write_nbyte = arg2; +} + +syscall::write*:return +/self->write_fd && arg0 > 0/ +{ + printf("%d,WRITE,%d,,,\n", walltimestamp, arg0); +} + +syscall::read*:entry +/self->inet_fds[arg0]/ +{ + self->read_fd = arg0; +} + +syscall::read*:return +/self->read_fd && arg0 > 0/ +{ + printf("%d,READ,%d,,,\n", walltimestamp, arg0); +} + +proc:::lwp-start +/execname == SSH || execname == PYTHON/ +{ + self->start_vtime = vtimestamp; + printf("%d,START,,,%d,%s\n", walltimestamp, pid, execname); +} + +proc:::lwp-exit +/(execname == SSH || execname == PYTHON) && self->start_vtime/ +{ + this->nsecs = vtimestamp - self->start_vtime; + printf("%d,EXIT,,%d,%d,%s\n", walltimestamp, this->nsecs, pid, execname); +} + +sched:::on-cpu +/self->start_vtime/ +{ + self->ontime = vtimestamp; +} + +sched:::off-cpu +/self->ontime/ +{ + this->spent = vtimestamp - self->ontime; + printf("%d,SCHED,,%d,%d,%s\n", walltimestamp, this->spent, pid, execname); +}