Context Navigation

source: memlog_analyze @ c83befc

Revision c83befc, 10.9 KB checked in by Hal Finkel <hfinkel@…>, 9 years ago (diff)
make the output dir if it does not exist
Property mode set to `100755`

Line
1	#! /usr/bin/env perl
2	use strict;
3	use File::Basename;
4	use File::Path qw(make_path);
5	use Getopt::Long;
6
# Command-line switches. All start out off; GetOptions turns them on.
#   $find_leaks          - --leaks
#   $print_raw_proc_name - --print-symbol-names
#   $quiet               - --quiet / -q
#   $help                - --help / -h / -?
my ($find_leaks, $print_raw_proc_name, $quiet, $help) = (0, 0, 0, 0);
11
# Print the command-line synopsis and terminate the program.
#
# Parameters:
#   $_[0] - the process exit code. Zero means the user asked for help; any
#           other value reports a usage error.
#
# The text is written to STDOUT for a zero exit code and to STDERR otherwise,
# so a usage error never ends up in output that is being piped elsewhere.
# This function does not return.
sub print_usage($) {
    my $ec = $_[0];
    my $usage = <<EOM;
Usage: $0 [options] <memlog file or glob> [<output directory>]
  options:
    --help or -h
      Print this message and exit
    --leaks
      Provide information on leaks instead of peak usage
    --print-symbol-names
      Include symbol names and offsets in the output
    --quiet or -q
      Don't print status messages while running
EOM

    my $out = $ec ? \*STDERR : \*STDOUT;
    print {$out} $usage;
    exit($ec);
}
28
# Parse the command-line switches. On an unrecognised switch GetOptions
# returns false and the usage text is printed with exit code 1.
GetOptions("help|h|?" => \$help,
           "leaks" => \$find_leaks,
           "print-symbol-names" => \$print_raw_proc_name,
           "quiet|q" => \$quiet)
    or print_usage(1);

if ($help) {
    print_usage(0);
}

# Exactly one memlog file (or glob) is required; the output directory is
# optional. Without the lower bound a bare invocation would carry an undefined
# file name into the file tests below.
if (scalar(@ARGV) < 1 || scalar(@ARGV) > 2) {
    print_usage(2);
}

my $memlog_fn = $ARGV[0];

# Default to the current directory. The test is on definedness and length
# rather than truth, so a directory literally named "0" is honoured.
my $out_dir = (defined $ARGV[1] && length $ARGV[1]) ? $ARGV[1] : '.';

make_path($out_dir);
if (! -d $out_dir) {
    die "Can't create output directory $out_dir\n";
}
47
# If the argument does not name an existing file, treat it as a glob pattern
# and choose, among the matching files, the one whose last record reports the
# largest maxrss. With no usable match the usage text is printed and the
# program exits with code 1.
if (! -f $memlog_fn) {
    # Only plain files can be memlog files; drop directories and the like.
    my @pot_fns = grep { -f $_ } glob($memlog_fn);
    if (!scalar(@pot_fns)) {
        print_usage(1);
    }

    if (!$quiet) {
        print "Searching all files matching '$memlog_fn'\n";
    }

    my $pot_max_rss = 0;
    my $pos_max_rss_fn;
    foreach my $pot_fn (@pot_fns) {
        # Run tail through a list-form pipe so the file name never reaches a
        # shell; quotes or other metacharacters in the name are harmless.
        my $last_line;
        if (open(my $tail, '-|', 'tail', '-n', '1', '--', $pot_fn)) {
            $last_line = <$tail>;
            close($tail);
        }
        next unless defined $last_line;
        chomp($last_line);

        # A record is tab-separated: operation, state, then stack frames.
        # The state is whitespace-separated: time, maxrss, thread id.
        my (undef, $state) = split(/\t/, $last_line);
        next unless defined $state;

        my (undef, $then_max_rss) = split(/\s+/, $state);
        next unless defined $then_max_rss;

        if ($pot_max_rss < $then_max_rss) {
            $pot_max_rss = $then_max_rss;
            $pos_max_rss_fn = $pot_fn;
        }
    }

    if (!defined $pos_max_rss_fn) {
        print_usage(1);
    }

    $memlog_fn = $pos_max_rss_fn;
}
82
# Which addr2line (and related tools) gets picked up matters a great deal,
# particularly on big-endian ppc64: older releases mishandled the function
# descriptor setup there. On the ALCF BG/Q, newer builds ship with bgclang
# outside the default search path, so put that directory first when present.
my $alcf_bu_dir = '/soft/compilers/bgclang/current/binutils/bin';
$ENV{'PATH'} = $alcf_bu_dir . ':' . $ENV{'PATH'} if -d $alcf_bu_dir;
91
# Open the log with a lexical handle and an explicit read mode, so the file
# name can never be interpreted as an open mode or a command.
open(my $memlog_fh, '<', $memlog_fn) or die "Can't open $memlog_fn: $!";

# The first step is to determine the high-water mark.
# The log is read line by line; memlog files can be large and there is no
# need to hold the whole file in memory.
my $max_rss = 0;
while (my $line = <$memlog_fh>) {
    chomp($line);

    # A record is tab-separated: operation, state, then stack frames.
    # The state is whitespace-separated: time, maxrss, thread id.
    my (undef, $state) = split(/\t/, $line);
    next unless defined $state;

    my (undef, $then_max_rss) = split(/\s+/, $state);
    next unless defined $then_max_rss;

    if ($max_rss < $then_max_rss) {
        $max_rss = $then_max_rss;
    }
}

seek($memlog_fh, 0, 0) or die "Can't rewind $memlog_fn: $!";

# Scan the log for malloc/free pairings. We're interested only in active
# allocations at the time when the rss reaches the final maxrss.
# If we're finding leaks, then go to the very end.
my $active_alloc_time = 0;
my %malloc_lines;    # pointer (hex, without 0x) => full record of the malloc
while (my $line = <$memlog_fh>) {
    chomp($line);

    my ($op, $state) = split(/\t/, $line);
    next unless defined $op;

    if ($op =~ /^M: \d+ 0x(\w+)/) {
        $malloc_lines{$1} = $line;
    } elsif ($op =~ /^F: 0x(\w+)/) {
        delete $malloc_lines{$1};
    } else {
        # Neither a well-formed malloc nor a well-formed free record.
        next;
    }

    next unless defined $state;
    my ($time, $then_max_rss) = split(/\s+/, $state);
    $active_alloc_time = $time;

    if (!$find_leaks) {
        # If we've reached the max rss, we've seen all we need to see.
        if (defined $then_max_rss && $then_max_rss == $max_rss) {
            last;
        }
    }
}

close($memlog_fh);

# Convert maxrss, currently in KB, to bytes.
$max_rss *= 1024;
148
# Split one stack-frame field of a memlog record into its components.
#
# The field is expected to look like
#   <file> (<symbol>+0x<offset>) [0x<pc> (0x<relative pc>)]
#
# Parameters:
#   $_[0] - the frame text.
# Returns:
#   the list (file name, symbol name, offset, pc, relative pc), with the
#   numeric parts as hex strings without the 0x prefix. Every element is undef
#   when the text does not have the expected shape.
sub level_parts($) {
    my $level = $_[0];
    my ($file_name, $proc_name, $off, $pc, $relpc) =
        ($level =~ /^(.*) \((.*)\+0x(\w+)\) \[0x(\w+) \(0x(\w+)\)\]/);

    return ($file_name, $proc_name, $off, $pc, $relpc);
}

# Build the call graph of the allocations that are still active.
#   $total_size - sum of the sizes of all active allocations, in bytes.
#   %all_nodes  - pc => node hash (file_name, proc_name, off, pc, relpc, size,
#                 child_sizes). A node is shared by every stack through it.
#   %roots      - per-depth lookup: the keys are the pcs seen at that depth
#                 plus 'children', which holds the hash for the next depth.
my $total_size = 0;
my %roots;
my %all_nodes;
foreach my $line (values %malloc_lines) {
    my ($op, $state, @parts) = split(/\t/, $line);

    # Only dealing with allocations here...
    next unless defined $op;
    my ($size) = ($op =~ /^M: (\d+) 0x\w+/);
    next unless defined $size;

    $total_size += $size;

    # Put the top of the stack first, and keep only frames that can be
    # attributed to a file. Filtering before linking means a caller is
    # connected to the next *known* frame, so no edge ever points at a pc
    # that has no node.
    my @frames;
    foreach my $level (reverse(@parts)) {
        my ($file_name, $proc_name, $off, $pc, $relpc) = level_parts($level);

        # Skip frames that could not be parsed at all.
        next unless defined $pc;

        # Skip this level if we don't even know from what file it came.
        next if $file_name eq '?';

        push(@frames, [$file_name, $proc_name, $off, $pc, $relpc]);
    }

    my $parent = \%roots;
    for (my $i = 0; $i < scalar(@frames); ++$i) {
        my ($file_name, $proc_name, $off, $pc, $relpc) = @{$frames[$i]};

        if (!exists $all_nodes{$pc}) {
            $all_nodes{$pc} = {
                'file_name' => $file_name,
                'proc_name' => $proc_name,
                'off'       => $off,
                'pc'        => $pc,
                'relpc'     => $relpc,
            };
        }

        if (!exists $parent->{$pc}) {
            $parent->{$pc} = $all_nodes{$pc};
        }

        $parent->{$pc}->{'size'} += $size;

        # Attribute this allocation to the edge leading to the next frame.
        if ($i < scalar(@frames) - 1) {
            my $next_pc = $frames[$i + 1]->[3];
            $parent->{$pc}->{'child_sizes'}->{$next_pc} += $size;
        }

        if (!exists $parent->{'children'}) {
            $parent->{'children'} = {};
        }

        $parent = $parent->{'children'};
    }
}
220
# All outputs are named after the memlog file and placed in the output
# directory.
my $out_base = "$out_dir/" . basename($memlog_fn);
my $txt_fn = "$out_base.txt";
my $dot_fn = "$out_base.dot";
my $ps_fn = "$out_base.ps";
my $pdf_fn = "$out_base.pdf";

if (!$quiet) {
    print "Creating $txt_fn\n";
}

# Three-argument open keeps the write mode separate from the file name, so a
# name with leading or trailing special characters is taken literally.
open(TXT, '>', $txt_fn) or die "Can't open $txt_fn: $!";

if (!$quiet) {
    print "Creating $dot_fn\n";
}

open(DOT, '>', $dot_fn) or die "Can't open $dot_fn: $!";
237
# Render a byte count with three decimals and a binary-scaled unit.
#
# Parameters:
#   $_[0] - the size in bytes; undef is treated as 0.
# Returns:
#   a string such as "1.500 KB". The value is divided by 1024 until it drops
#   below 1024 or the largest unit (PB) is reached, so the unit lookup can
#   never run past the end of the table.
sub format_bytes($) {
    my @sizes = qw( B KB MB GB TB PB );
    my $size = defined $_[0] ? $_[0] : 0;

    my $i = 0;
    # ">=" so that exactly 1024 bytes reads as 1.000 KB, not 1024.000 B.
    while ($size >= 1024 && $i < $#sizes) {
        $size /= 1024;
        ++$i;
    }

    return sprintf("%.3f %s", $size, $sizes[$i]);
}
250
# Start the graph: name it and set the page size and the minimum node
# dimensions.
print DOT ("digraph \"memlog\" {\n",
           "size=\"8,11\";\n",
           "node [width=0.375,height=0.25];\n");

# Marker added to the summary when reporting leaks instead of peak usage.
my $find_type = "";
$find_type = " (leaks)" if $find_leaks;

# The same three figures head both outputs: the total active size, the
# maxrss, and the time of the last record that was taken into account.
my @summary_args = (format_bytes($total_size), format_bytes($max_rss),
                    $active_alloc_time);

printf DOT ("Legend [shape=box, fontsize=100, shape=oval," .
            "label=\"Total: %s active$find_type at maxrss = %s after %s s\"];\n",
            @summary_args);

printf TXT ("memlog: Total: %s active$find_type at maxrss = %s after %s s\n\n",
            @summary_args);
264
# Run an external program without involving a shell and return its standard
# output as a list of lines (line endings included). Returns an empty list
# when the program cannot be started.
sub _capture_lines {
    my @cmd = @_;

    open(my $pipe, '-|', @cmd) or return;
    my @lines = <$pipe>;
    close($pipe);

    return @lines;
}

# Demangle a C++ symbol with c++filt. Returns the symbol unchanged when
# c++filt produces no output (for example because it is not installed), and
# an empty string for an empty or undefined symbol.
sub _demangle {
    my ($symbol) = @_;
    return '' unless defined $symbol && length $symbol;

    my ($out) = _capture_lines('c++filt', $symbol);
    return $symbol unless defined $out;

    chomp($out);
    return $out;
}

my %cached_names;    # pc => label text already computed by get_name

# Build the display label for a call-graph node.
#
# Parameters:
#   $_[0] - node hash reference with the keys pc, relpc, file_name, proc_name
#           and off.
# Returns:
#   the label text. Its parts are joined by a literal backslash followed by
#   'n' (the line-break escape used in DOT labels), not by real newlines.
#   In order: the function name and source location when addr2line can
#   resolve them (otherwise the demangled symbol name, if known), the file
#   name, and - with --print-symbol-names - the raw symbol and offset.
#
# Results are cached per pc, so the external tools run once per node.
sub get_name($) {
    my $node = $_[0];
    my $pc = $node->{'pc'};

    if (exists $cached_names{$pc}) {
        return $cached_names{$pc};
    }

    my $ret = '';

    # Prefer the relative offset (that is what we want for shared libraries),
    # but if it is not available, use the full offset (which is what we want
    # for the base executable).
    my $exe_off = $node->{'relpc'};
    if (!$exe_off) {
        $exe_off = $pc;
    }

    my $file_name = $node->{'file_name'};

    # If we don't have an absolute path, this is probably the base dynamic
    # executable, so look it up on the PATH (not foolproof because we might
    # not have the same PATH now, but hopefully is generally the right thing).
    if ($file_name !~ /^\//) {
        ($file_name) = _capture_lines('which', $file_name);
        $file_name = '' unless defined $file_name;
        chomp($file_name);
    }

    # addr2line -f prints the function name on the first line and the
    # file:line location on the second. Skip it when there is no file to ask.
    my ($func, $loc);
    if (length $file_name) {
        ($func, $loc) = _capture_lines('addr2line', '-e', $file_name,
                                       '-f', "0x$exe_off");
    }
    $func = '' unless defined $func;
    $loc = '' unless defined $loc;
    chomp($func);
    chomp($loc);

    my $proc_name = $node->{'proc_name'};
    my $have_proc = (defined $proc_name && $proc_name ne '?');

    # An empty answer means addr2line failed; treat it like an unknown ('?')
    # function instead of emitting blank label lines.
    if (length($func) && $func !~ /^\?/) {
        # In general, this function name might look something like:
        # 00000329.plt_call.wcsnrtombs@@GLIBC_2.3+0
        $func =~ s/@.*//; # Remove trailing symbol version strings
        $func =~ s/.*\.//; # Keep only what follows the last dot
        $func = _demangle($func);

        # It sometimes happens that addr2line is a bit too smart: when
        # debugging information is available, it might print a local alias
        # for the function instead of the full name (for example, printing
        # 'List' instead of 'Foo::List<int>::List(int, int const&)').
        if ($have_proc) {
            my $demangled = _demangle($proc_name);
            if (length($demangled) > length($func)) {
                $func = $demangled;
            }
        }

        $ret .= $func . '\n';

        if (length($loc) && $loc !~ /^[:?]/) {
            $ret .= $loc . '\n';
        }
    } elsif ($have_proc) {
        $ret .= _demangle($proc_name) . '\n';
    }

    $ret .= $node->{'file_name'};
    if ($print_raw_proc_name and $have_proc) {
        $ret .= '\n' . $proc_name . '+0x' . $node->{'off'};
    }

    $cached_names{$pc} = $ret;
    return $ret;
}
342
# Nodes responsible for less than this fraction of the total active size are
# left out of both reports.
my $skip_frac = 0.01;
my %skipped;    # pc => 1 for every node that was left out

# Emit one DOT node per significant call-graph node.
foreach my $pc (keys %all_nodes) {
    my $node = $all_nodes{$pc};

    my $local_size = $node->{'size'};

    # Guard the division: the total is zero when every active allocation has
    # size zero, and then nothing is significant.
    my $share = ($total_size > 0) ? $local_size * 1.0 / $total_size : 0;
    if ($share < $skip_frac) {
        $skipped{$pc} = 1;
        next;
    }

    # Scale the font with the node's share of the total.
    my $fs = 8.0;
    if ($local_size > 0) {
        $fs = 50.0 * (abs($share))**0.125;
    }

    # Work on a copy so the cached label stays untouched, and escape double
    # quotes so they cannot terminate the quoted DOT label early.
    my $name = get_name($node);
    $name =~ s/"/\\"/g;

    # The format has exactly one conversion per argument.
    printf DOT ("N%s [label=\"%s\\n%s\", shape=box, fontsize=%.1f];\n",
                $pc, $name, format_bytes($local_size), $fs);
}
365
# Emit one DOT edge for every caller/callee pair in which both ends are
# significant, then close the graph.
foreach my $pc (keys %all_nodes) {
    if ($skipped{$pc}) {
        next;
    }

    my $node = $all_nodes{$pc};
    my $local_size = $node->{'size'};

    foreach my $cpc (keys %{$node->{'child_sizes'}}) {
        if ($skipped{$cpc}) {
            next;
        }

        # A child pc has no node when its frame was dropped while the graph
        # was built (frames from an unknown file are skipped there). An edge
        # to it would reference a node that is never declared.
        if (!exists $all_nodes{$cpc}) {
            next;
        }

        my $child_size = $node->{'child_sizes'}->{$cpc};
        my $frac = $child_size * 1.0 / $local_size;

        # Line width, layout weight and font size all grow with the fraction
        # of the caller's size that goes through this edge.
        my $weight = 100.0 * sqrt($frac);
        my $style = sprintf("setlinewidth(%f)", 8.0 * sqrt($frac));

        my $fs = 40.0 * $frac**0.125;

        printf DOT ("N%s -> N%s [label=\"%s\", weight=%d, style=\"%s\", fontsize=%.1f];\n",
                    $pc, $cpc, format_bytes($child_size), $weight, $style, $fs);
    }
}

print DOT ("}\n");
393
# Write the text report: one section per significant node, largest first,
# each followed by its significant callees, also largest first.
foreach my $pc (sort { $all_nodes{$b}->{'size'} <=>
                       $all_nodes{$a}->{'size'} } keys %all_nodes) {
    if ($skipped{$pc}) {
        next;
    }

    print TXT ('*' x 80) . "\n\n";

    my $node = $all_nodes{$pc};

    my $local_size = $node->{'size'};
    printf TXT ("%s - %.1f%%\n", format_bytes($local_size),
                $local_size * 100.0 / $total_size);

    # get_name separates label parts with a literal backslash-n (the DOT
    # convention); turn those into real line breaks for the text file.
    my $name = get_name($node);
    $name =~ s/\\n/\n/g;

    print TXT "$name\n$pc\n";

    print TXT "\nMEMORY ALLOCATED BY CALLEES:\n";

    # A leaf node has no child_sizes entry at all.
    my $child_sizes = $node->{'child_sizes'} || {};
    foreach my $cpc (sort { $child_sizes->{$b} <=> $child_sizes->{$a} }
                     keys %{$child_sizes}) {
        if ($skipped{$cpc}) {
            next;
        }

        # A child pc has no node when its frame was dropped while the graph
        # was built (frames from an unknown file are skipped there); there is
        # nothing to name or report for it.
        my $child_node = $all_nodes{$cpc};
        if (!defined $child_node) {
            next;
        }

        my $child_size = $child_sizes->{$cpc};

        printf TXT ("\t%s - %.1f%%\n", format_bytes($child_size),
                    $child_size * 100.0 / $local_size);

        my $child_name = get_name($child_node);
        $child_name =~ s/\\n/\n\t/g;
        print TXT "\t$child_name\n\t$cpc\n";

        print TXT "\n";
    }

    print TXT "\n";
}

# Buffered write errors (a full disk, for example) only surface at close.
close(TXT) or die "Can't close $txt_fn: $!";
close(DOT) or die "Can't close $dot_fn: $!";
440
# Render the graph: dot turns the DOT file into PostScript, and ps2pdf turns
# that into a PDF. Both run in list form, so the file names are passed as
# plain arguments and are never interpreted by a shell.
if (!$quiet) {
    print "Creating $ps_fn\n";
}

my $dot_ok = (system('dot', '-Tps2', '-o', $ps_fn, $dot_fn) == 0);
if (!$dot_ok) {
    warn "dot failed; $ps_fn and $pdf_fn were not created\n";
}

# Without a PostScript file there is nothing to convert.
if ($dot_ok) {
    if (!$quiet) {
        print "Creating $pdf_fn\n";
    }

    if (system('ps2pdf', $ps_fn, $pdf_fn) != 0) {
        warn "ps2pdf failed; $pdf_fn was not created\n";
    }
}

# The text and DOT reports have been written at this point, so a rendering
# failure is reported as a warning only.
exit 0;
454

Note: See TracBrowser for help on using the repository browser.

Download in other formats: