diff options
author | Tony Jones <tonyj@suse.com> | 2015-08-17 15:48:52 -0400 |
---|---|---|
committer | Arnaldo Carvalho de Melo <acme@redhat.com> | 2015-08-28 13:53:40 -0400 |
commit | 84e5d89a777cca26cc513264752b439874702dd6 (patch) | |
tree | 4ac2209d0622579f405925b20d2a38dc79b6dc6d /tools/perf/scripts/python/compaction-times.py | |
parent | 1d945012d1381f0232ea2d66e32b06182eedb476 (diff) |
perf scripts python: Add new compaction-times script
This patch creates a new script (compaction-times) to report time
spent in mm compaction. It is possible to report times in nanoseconds
(default) or microseconds (-u).
The option -p will break down results by process id, -pv will further
decompose by each compaction entry/exit.
For each compaction entry/exit what is reported is controlled by the
options:
-t report only timing
-m report migration stats
-ms report migration scanner stats
-fs report free scanner stats
The default is to report all.
Entries may be further filtered by pid, pid-range or comm (regex).
The script is useful when analysing workloads that compact memory. The
most common example will be THP allocations on systems with a lot of
uptime that has fragmented memory.
This is an example of using the script to analyse a thpscale from
mmtests which deliberately fragments memory and allocates THP in 4
separate threads
# Recording step, one of the following;
$ perf record -e 'compaction:mm_compaction_*' ./workload
# or:
$ perf script record compaction-times
# Reporting: basic
total: 2444505743ns migration: moved=357738 failed=39275
free_scanner: scanned=2705578 isolated=387875
migration_scanner: scanned=414426 isolated=397013
# Reporting: Per task stall times
$ perf script report compaction-times -- -t -p
total: 2444505743ns
6384[thpscale]: 740800017ns
6385[thpscale]: 274119512ns
6386[thpscale]: 832961337ns
6383[thpscale]: 596624877ns
# Reporting: Per-compaction attempts for task 6385
$ perf script report compaction-times -- -m -pv 6385
total: 274119512ns migration: moved=14893 failed=24285
6385[thpscale]: 274119512ns migration: moved=14893 failed=24285
6385[thpscale].1: 3033277ns migration: moved=511 failed=1
6385[thpscale].2: 9592094ns migration: moved=1524 failed=12
6385[thpscale].3: 2495587ns migration: moved=512 failed=0
6385[thpscale].4: 2561766ns migration: moved=512 failed=0
6385[thpscale].5: 2523521ns migration: moved=512 failed=0
..... output continues ...
Changes since v1:
- report stats for isolate_migratepages and isolate_freepages
(Vlastimil Babka)
- refactor code to achieve above
- add help text
- output to stdout/stderr explicitly
Signed-off-by: Tony Jones <tonyj@suse.com>
Cc: Mel Gorman <mgorman@suse.com>
Cc: Vlastimil Babka <vbabka@suse.cz>
Link: http://lkml.kernel.org/r/1439840932-8933-1-git-send-email-tonyj@suse.com
Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
Diffstat (limited to 'tools/perf/scripts/python/compaction-times.py')
-rw-r--r-- | tools/perf/scripts/python/compaction-times.py | 311 |
1 files changed, 311 insertions, 0 deletions
diff --git a/tools/perf/scripts/python/compaction-times.py b/tools/perf/scripts/python/compaction-times.py new file mode 100644 index 000000000000..239cb0568ec3 --- /dev/null +++ b/tools/perf/scripts/python/compaction-times.py | |||
@@ -0,0 +1,311 @@ | |||
1 | # report time spent in compaction | ||
2 | # Licensed under the terms of the GNU GPL License version 2 | ||
3 | |||
4 | # testing: | ||
5 | # 'echo 1 > /proc/sys/vm/compact_memory' to force compaction of all zones | ||
6 | |||
7 | import os | ||
8 | import sys | ||
9 | import re | ||
10 | |||
11 | import signal | ||
12 | signal.signal(signal.SIGPIPE, signal.SIG_DFL) | ||
13 | |||
14 | usage = "usage: perf script report compaction-times.py -- [-h] [-u] [-p|-pv] [-t | [-m] [-fs] [-ms]] [pid|pid-range|comm-regex]\n" | ||
15 | |||
16 | class popt: | ||
17 | DISP_DFL = 0 | ||
18 | DISP_PROC = 1 | ||
19 | DISP_PROC_VERBOSE=2 | ||
20 | |||
21 | class topt: | ||
22 | DISP_TIME = 0 | ||
23 | DISP_MIG = 1 | ||
24 | DISP_ISOLFREE = 2 | ||
25 | DISP_ISOLMIG = 4 | ||
26 | DISP_ALL = 7 | ||
27 | |||
28 | class comm_filter: | ||
29 | def __init__(self, re): | ||
30 | self.re = re | ||
31 | |||
32 | def filter(self, pid, comm): | ||
33 | m = self.re.search(comm) | ||
34 | return m == None or m.group() == "" | ||
35 | |||
36 | class pid_filter: | ||
37 | def __init__(self, low, high): | ||
38 | self.low = (0 if low == "" else int(low)) | ||
39 | self.high = (0 if high == "" else int(high)) | ||
40 | |||
41 | def filter(self, pid, comm): | ||
42 | return not (pid >= self.low and (self.high == 0 or pid <= self.high)) | ||
43 | |||
44 | def set_type(t): | ||
45 | global opt_disp | ||
46 | opt_disp = (t if opt_disp == topt.DISP_ALL else opt_disp|t) | ||
47 | |||
48 | def ns(sec, nsec): | ||
49 | return (sec * 1000000000) + nsec | ||
50 | |||
51 | def time(ns): | ||
52 | return "%dns" % ns if opt_ns else "%dus" % (round(ns, -3) / 1000) | ||
53 | |||
54 | class pair: | ||
55 | def __init__(self, aval, bval, alabel = None, blabel = None): | ||
56 | self.alabel = alabel | ||
57 | self.blabel = blabel | ||
58 | self.aval = aval | ||
59 | self.bval = bval | ||
60 | |||
61 | def __add__(self, rhs): | ||
62 | self.aval += rhs.aval | ||
63 | self.bval += rhs.bval | ||
64 | return self | ||
65 | |||
66 | def __str__(self): | ||
67 | return "%s=%d %s=%d" % (self.alabel, self.aval, self.blabel, self.bval) | ||
68 | |||
69 | class cnode: | ||
70 | def __init__(self, ns): | ||
71 | self.ns = ns | ||
72 | self.migrated = pair(0, 0, "moved", "failed") | ||
73 | self.fscan = pair(0,0, "scanned", "isolated") | ||
74 | self.mscan = pair(0,0, "scanned", "isolated") | ||
75 | |||
76 | def __add__(self, rhs): | ||
77 | self.ns += rhs.ns | ||
78 | self.migrated += rhs.migrated | ||
79 | self.fscan += rhs.fscan | ||
80 | self.mscan += rhs.mscan | ||
81 | return self | ||
82 | |||
83 | def __str__(self): | ||
84 | prev = 0 | ||
85 | s = "%s " % time(self.ns) | ||
86 | if (opt_disp & topt.DISP_MIG): | ||
87 | s += "migration: %s" % self.migrated | ||
88 | prev = 1 | ||
89 | if (opt_disp & topt.DISP_ISOLFREE): | ||
90 | s += "%sfree_scanner: %s" % (" " if prev else "", self.fscan) | ||
91 | prev = 1 | ||
92 | if (opt_disp & topt.DISP_ISOLMIG): | ||
93 | s += "%smigration_scanner: %s" % (" " if prev else "", self.mscan) | ||
94 | return s | ||
95 | |||
96 | def complete(self, secs, nsecs): | ||
97 | self.ns = ns(secs, nsecs) - self.ns | ||
98 | |||
99 | def increment(self, migrated, fscan, mscan): | ||
100 | if (migrated != None): | ||
101 | self.migrated += migrated | ||
102 | if (fscan != None): | ||
103 | self.fscan += fscan | ||
104 | if (mscan != None): | ||
105 | self.mscan += mscan | ||
106 | |||
107 | |||
108 | class chead: | ||
109 | heads = {} | ||
110 | val = cnode(0); | ||
111 | fobj = None | ||
112 | |||
113 | @classmethod | ||
114 | def add_filter(cls, filter): | ||
115 | cls.fobj = filter | ||
116 | |||
117 | @classmethod | ||
118 | def create_pending(cls, pid, comm, start_secs, start_nsecs): | ||
119 | filtered = 0 | ||
120 | try: | ||
121 | head = cls.heads[pid] | ||
122 | filtered = head.is_filtered() | ||
123 | except KeyError: | ||
124 | if cls.fobj != None: | ||
125 | filtered = cls.fobj.filter(pid, comm) | ||
126 | head = cls.heads[pid] = chead(comm, pid, filtered) | ||
127 | |||
128 | if not filtered: | ||
129 | head.mark_pending(start_secs, start_nsecs) | ||
130 | |||
131 | @classmethod | ||
132 | def increment_pending(cls, pid, migrated, fscan, mscan): | ||
133 | head = cls.heads[pid] | ||
134 | if not head.is_filtered(): | ||
135 | if head.is_pending(): | ||
136 | head.do_increment(migrated, fscan, mscan) | ||
137 | else: | ||
138 | sys.stderr.write("missing start compaction event for pid %d\n" % pid) | ||
139 | |||
140 | @classmethod | ||
141 | def complete_pending(cls, pid, secs, nsecs): | ||
142 | head = cls.heads[pid] | ||
143 | if not head.is_filtered(): | ||
144 | if head.is_pending(): | ||
145 | head.make_complete(secs, nsecs) | ||
146 | else: | ||
147 | sys.stderr.write("missing start compaction event for pid %d\n" % pid) | ||
148 | |||
149 | @classmethod | ||
150 | def gen(cls): | ||
151 | if opt_proc != popt.DISP_DFL: | ||
152 | for i in cls.heads: | ||
153 | yield cls.heads[i] | ||
154 | |||
155 | @classmethod | ||
156 | def str(cls): | ||
157 | return cls.val | ||
158 | |||
159 | def __init__(self, comm, pid, filtered): | ||
160 | self.comm = comm | ||
161 | self.pid = pid | ||
162 | self.val = cnode(0) | ||
163 | self.pending = None | ||
164 | self.filtered = filtered | ||
165 | self.list = [] | ||
166 | |||
167 | def __add__(self, rhs): | ||
168 | self.ns += rhs.ns | ||
169 | self.val += rhs.val | ||
170 | return self | ||
171 | |||
172 | def mark_pending(self, secs, nsecs): | ||
173 | self.pending = cnode(ns(secs, nsecs)) | ||
174 | |||
175 | def do_increment(self, migrated, fscan, mscan): | ||
176 | self.pending.increment(migrated, fscan, mscan) | ||
177 | |||
178 | def make_complete(self, secs, nsecs): | ||
179 | self.pending.complete(secs, nsecs) | ||
180 | chead.val += self.pending | ||
181 | |||
182 | if opt_proc != popt.DISP_DFL: | ||
183 | self.val += self.pending | ||
184 | |||
185 | if opt_proc == popt.DISP_PROC_VERBOSE: | ||
186 | self.list.append(self.pending) | ||
187 | self.pending = None | ||
188 | |||
189 | def enumerate(self): | ||
190 | if opt_proc == popt.DISP_PROC_VERBOSE and not self.is_filtered(): | ||
191 | for i, pelem in enumerate(self.list): | ||
192 | sys.stdout.write("%d[%s].%d: %s\n" % (self.pid, self.comm, i+1, pelem)) | ||
193 | |||
194 | def is_pending(self): | ||
195 | return self.pending != None | ||
196 | |||
197 | def is_filtered(self): | ||
198 | return self.filtered | ||
199 | |||
200 | def display(self): | ||
201 | if not self.is_filtered(): | ||
202 | sys.stdout.write("%d[%s]: %s\n" % (self.pid, self.comm, self.val)) | ||
203 | |||
204 | |||
205 | def trace_end(): | ||
206 | sys.stdout.write("total: %s\n" % chead.str()) | ||
207 | for i in chead.gen(): | ||
208 | i.display(), | ||
209 | i.enumerate() | ||
210 | |||
211 | def compaction__mm_compaction_migratepages(event_name, context, common_cpu, | ||
212 | common_secs, common_nsecs, common_pid, common_comm, | ||
213 | common_callchain, nr_migrated, nr_failed): | ||
214 | |||
215 | chead.increment_pending(common_pid, | ||
216 | pair(nr_migrated, nr_failed), None, None) | ||
217 | |||
218 | def compaction__mm_compaction_isolate_freepages(event_name, context, common_cpu, | ||
219 | common_secs, common_nsecs, common_pid, common_comm, | ||
220 | common_callchain, start_pfn, end_pfn, nr_scanned, nr_taken): | ||
221 | |||
222 | chead.increment_pending(common_pid, | ||
223 | None, pair(nr_scanned, nr_taken), None) | ||
224 | |||
225 | def compaction__mm_compaction_isolate_migratepages(event_name, context, common_cpu, | ||
226 | common_secs, common_nsecs, common_pid, common_comm, | ||
227 | common_callchain, start_pfn, end_pfn, nr_scanned, nr_taken): | ||
228 | |||
229 | chead.increment_pending(common_pid, | ||
230 | None, None, pair(nr_scanned, nr_taken)) | ||
231 | |||
232 | def compaction__mm_compaction_end(event_name, context, common_cpu, | ||
233 | common_secs, common_nsecs, common_pid, common_comm, | ||
234 | common_callchain, zone_start, migrate_start, free_start, zone_end, | ||
235 | sync, status): | ||
236 | |||
237 | chead.complete_pending(common_pid, common_secs, common_nsecs) | ||
238 | |||
239 | def compaction__mm_compaction_begin(event_name, context, common_cpu, | ||
240 | common_secs, common_nsecs, common_pid, common_comm, | ||
241 | common_callchain, zone_start, migrate_start, free_start, zone_end, | ||
242 | sync): | ||
243 | |||
244 | chead.create_pending(common_pid, common_comm, common_secs, common_nsecs) | ||
245 | |||
246 | def pr_help(): | ||
247 | global usage | ||
248 | |||
249 | sys.stdout.write(usage) | ||
250 | sys.stdout.write("\n") | ||
251 | sys.stdout.write("-h display this help\n") | ||
252 | sys.stdout.write("-p display by process\n") | ||
253 | sys.stdout.write("-pv display by process (verbose)\n") | ||
254 | sys.stdout.write("-t display stall times only\n") | ||
255 | sys.stdout.write("-m display stats for migration\n") | ||
256 | sys.stdout.write("-fs display stats for free scanner\n") | ||
257 | sys.stdout.write("-ms display stats for migration scanner\n") | ||
258 | sys.stdout.write("-u display results in microseconds (default nanoseconds)\n") | ||
259 | |||
260 | |||
261 | comm_re = None | ||
262 | pid_re = None | ||
263 | pid_regex = "^(\d*)-(\d*)$|^(\d*)$" | ||
264 | |||
265 | opt_proc = popt.DISP_DFL | ||
266 | opt_disp = topt.DISP_ALL | ||
267 | |||
268 | opt_ns = True | ||
269 | |||
270 | argc = len(sys.argv) - 1 | ||
271 | if argc >= 1: | ||
272 | pid_re = re.compile(pid_regex) | ||
273 | |||
274 | for i, opt in enumerate(sys.argv[1:]): | ||
275 | if opt[0] == "-": | ||
276 | if opt == "-h": | ||
277 | pr_help() | ||
278 | exit(0); | ||
279 | elif opt == "-p": | ||
280 | opt_proc = popt.DISP_PROC | ||
281 | elif opt == "-pv": | ||
282 | opt_proc = popt.DISP_PROC_VERBOSE | ||
283 | elif opt == '-u': | ||
284 | opt_ns = False | ||
285 | elif opt == "-t": | ||
286 | set_type(topt.DISP_TIME) | ||
287 | elif opt == "-m": | ||
288 | set_type(topt.DISP_MIG) | ||
289 | elif opt == "-fs": | ||
290 | set_type(topt.DISP_ISOLFREE) | ||
291 | elif opt == "-ms": | ||
292 | set_type(topt.DISP_ISOLMIG) | ||
293 | else: | ||
294 | sys.exit(usage) | ||
295 | |||
296 | elif i == argc - 1: | ||
297 | m = pid_re.search(opt) | ||
298 | if m != None and m.group() != "": | ||
299 | if m.group(3) != None: | ||
300 | f = pid_filter(m.group(3), m.group(3)) | ||
301 | else: | ||
302 | f = pid_filter(m.group(1), m.group(2)) | ||
303 | else: | ||
304 | try: | ||
305 | comm_re=re.compile(opt) | ||
306 | except: | ||
307 | sys.stderr.write("invalid regex '%s'" % opt) | ||
308 | sys.exit(usage) | ||
309 | f = comm_filter(comm_re) | ||
310 | |||
311 | chead.add_filter(f) | ||