Context Navigation

source: memlog_analyze @ d270799

Revision d270799, 10.9 KB checked in by Hal Finkel <hfinkel@…>, 10 years ago (diff)
don't accept too many command-line parameters
Property mode set to `100755`

Line
1	#! /usr/bin/env perl
2	use strict;
3	use File::Basename;
4	use Getopt::Long;
5
6	my $find_leaks = 0;
7	my $print_raw_proc_name = 0;
8	my $quiet = 0;
9	my $help = 0;
10
11	sub print_usage($) {
12	my $ec = $_[0];
13	my $usage = <<EOM;
14	Usage: $0 [options] <memlog file or glob> [<output directory>]
15	options:
16	--leaks
17	Provide information on leaks instead of peak usage
18	--print-symbol-names
19	Include symbol names and offsets in the output
20	--quiet or -q
21	Don't print status messages while running
22	EOM
23
24	print $usage;
25	exit($ec);
26	}
27
28	GetOptions("help\|h\|?" => \$help,
29	"leaks" => \$find_leaks,
30	"print-symbol-names" => \$print_raw_proc_name,
31	"quiet\|q" => \$quiet)
32	or print_usage(1);
33
34	if ($help) {
35	print_usage(0);
36	}
37
38	if (scalar(@ARGV) > 1) {
39	print_usage(2);
40	}
41
42	my $memlog_fn = $ARGV[0];
43	my $out_dir = $ARGV[1] \|\| '.';
44
45	if (! -f $memlog_fn) {
46	my @pot_fns = glob($memlog_fn);
47	if (scalar(@pot_fns)) {
48	if (!$quiet) {
49	print "Searching all files matching '$memlog_fn'\n";
50	}
51
52	my $pot_max_rss = 0;
53	my $pos_max_rss_fn;
54	foreach my $pot_fn (@pot_fns) {
55	my $last_line = `tail -n 1 '$pot_fn'`;
56	chomp($last_line);
57
58	my @parts = split(/\t/, $last_line);
59
60	my $op = shift(@parts);
61	my $state = shift(@parts);
62
63	my ($time, $then_max_rss, $tid) = split(/\s+/, $state);
64	if ($pot_max_rss < $then_max_rss) {
65	$pot_max_rss = $then_max_rss;
66	$pos_max_rss_fn = $pot_fn;
67	}
68	}
69
70	if (defined $pos_max_rss_fn) {
71	$memlog_fn = $pos_max_rss_fn;
72	goto have_memlog_fn;
73	}
74	}
75
76	print_usage(1);
77	}
78	have_memlog_fn:
79
80	# The version of addr2line and friends that you use can make a big difference,
81	# especially on BE ppc64, where older versions of addr2line did not account
82	# correctly for the function descriptor setup. At ALCF, on the BG/Q, we have
83	# newer versions not in the default search path (from bgclang).
84	my $alcf_bu_dir = '/soft/compilers/bgclang/current/binutils/bin';
85	if (-d $alcf_bu_dir) {
86	$ENV{'PATH'} = $alcf_bu_dir . ':' . $ENV{'PATH'};
87	}
88
89	open(MEMLOG, $memlog_fn) \|\| die "Can't open $memlog_fn: $!";
90
91	# The first step is to determine the high-water mark.
92	my $max_rss = 0;
93	foreach my $line (<MEMLOG>) {
94	chomp($line);
95	my @parts = split(/\t/, $line);
96
97	my $op = shift(@parts);
98	my $state = shift(@parts);
99
100	my ($time, $then_max_rss, $tid) = split(/\s+/, $state);
101	if ($max_rss < $then_max_rss) {
102	$max_rss = $then_max_rss;
103	}
104	}
105
106	seek(MEMLOG, 0, 0);
107
108	# Scan the log for malloc/free pairings. We're interested only in active
109	# allocations at the time when the rss reaches the final maxrss.
110	# If we're finding leaks, then go to the very end.
111	my $active_alloc_time = 0;
112	my %malloc_lines;
113	foreach my $line (<MEMLOG>) {
114	chomp($line);
115	my @parts = split(/\t/, $line);
116
117	my $op = shift(@parts);
118	my $state = shift(@parts);
119
120	if ($op =~ /^M:/) {
121	my ($size, $ptr) = ($op =~ /^M: (\d+) 0x(\w+)/);
122	$malloc_lines{$ptr} = $line;
123	} elsif ($op =~ /^F:/) {
124	my ($ptr) = ($op =~ /^F: 0x(\w+)/);
125	delete $malloc_lines{$ptr};
126	} else {
127	next;
128	}
129
130	my ($time, $then_max_rss, $tid) = split(/\s+/, $state);
131	$active_alloc_time = $time;
132
133	if (!$find_leaks) {
134	# If we've reached the max rss, we've seen all we need to see.
135	if ($then_max_rss == $max_rss) {
136	last;
137	}
138	}
139	}
140
141	close(MEMLOG);
142
143	# Convert maxrss, currently in KB, to bytes.
144	$max_rss *= 1024;
145
146	my $total_size = 0;
147	my %roots;
148	my %all_nodes;
149	foreach my $line (values %malloc_lines) {
150	my @parts = split(/\t/, $line);
151
152	my $op = shift(@parts);
153	my $state = shift(@parts);
154
155	# Only dealing with allocations here...
156	if ($op !~ /^M:/) {
157	next;
158	}
159
160	my ($size, $ptr) = ($op =~ /^M: (\d+) 0x(\w+)/);
161	my ($time, $then_max_rss, $tid) = split(/\s+/, $state);
162
163	$total_size += $size;
164
165	sub level_parts($) {
166	my $level = @_[0];
167	my ($file_name, $proc_name, $off, $pc, $relpc) =
168	($level =~ /^(.) \((.)\+0x(\w+)\) \[0x(\w+) \(0x(\w+)\)\]/);
169
170	return ($file_name, $proc_name, $off, $pc, $relpc);
171	}
172
173	# Put the top of the stack first.
174	@parts = reverse(@parts);
175
176	my $parent = \%roots;
177	for (my $i = 0; $i < scalar(@parts); ++$i) {
178	my $level = $parts[$i];
179	my ($file_name, $proc_name, $off, $pc, $relpc) = level_parts($level);
180
181	# Skip this level if we don't even know from what file it came.
182	if ($file_name eq '?') {
183	next;
184	}
185
186	# print STDERR "parsed: $file_name, $proc_name, $off, $pc, $relpc\n";
187
188	if (!exists $all_nodes{$pc}) {
189	$all_nodes{$pc}->{'file_name'} = $file_name;
190	$all_nodes{$pc}->{'proc_name'} = $proc_name;
191	$all_nodes{$pc}->{'off'} = $off;
192	$all_nodes{$pc}->{'pc'} = $pc;
193	$all_nodes{$pc}->{'relpc'} = $relpc;
194	}
195
196	if (!exists $parent->{$pc}) {
197	$parent->{$pc} = $all_nodes{$pc};
198	}
199
200	$parent->{$pc}->{'size'} += $size;
201
202	my ($next_file_name, $next_proc_name, $next_off, $next_pc, $next_relpc);
203	if ($i < scalar(@parts)-1) {
204	my $next_level = $parts[$i+1];
205	($next_file_name, $next_proc_name, $next_off, $next_pc, $next_relpc) =
206	level_parts($next_level);
207	$parent->{$pc}->{'child_sizes'}->{$next_pc} += $size;
208	}
209
210	if (!exists $parent->{'children'}) {
211	$parent->{'children'} = {};
212	}
213
214	$parent = $parent->{'children'};
215	}
216	}
217
218	my $txt_fn = "$out_dir/" . basename($memlog_fn) . ".txt";
219	my $dot_fn = "$out_dir/" . basename($memlog_fn) . ".dot";
220	my $ps_fn = "$out_dir/" . basename($memlog_fn) . ".ps";
221	my $pdf_fn = "$out_dir/" . basename($memlog_fn) . ".pdf";
222
223	if (!$quiet) {
224	print "Creating $txt_fn\n";
225	}
226
227	open(TXT, ">$txt_fn") \|\| die "Can't open $txt_fn: $!";
228
229	if (!$quiet) {
230	print "Creating $dot_fn\n";
231	}
232
233	open(DOT, ">$dot_fn") \|\| die "Can't open $dot_fn: $!";
234
235	sub format_bytes($) {
236	my @sizes = qw( B KB MB GB TB PB );
237	my $size = $_[0];
238
239	my $i = 0;
240	while ($size > 1024) {
241	$size /= 1024;
242	++$i;
243	}
244
245	return sprintf("%.3f $sizes[$i]", $size);
246	}
247
248	print DOT ("digraph \"memlog\" {\n");
249	print DOT ("size=\"8,11\";\n");
250	print DOT ("node [width=0.375,height=0.25];\n");
251
252	my $find_type = $find_leaks ? " (leaks)" : "";
253	printf DOT ("Legend [shape=box, fontsize=100, shape=oval," .
254	"label=\"Total: %s active$find_type at maxrss = %s after %s s\"];\n",
255	format_bytes($total_size), format_bytes($max_rss),
256	$active_alloc_time);
257
258	printf TXT ("memlog: Total: %s active$find_type at maxrss = %s after %s s\n\n",
259	format_bytes($total_size), format_bytes($max_rss),
260	$active_alloc_time);
261
262	my %cached_names;
263	sub get_name($) {
264	my $node = $_[0];
265	my $pc = $node->{'pc'};
266
267	if (exists $cached_names{$pc}) {
268	return $cached_names{$pc};
269	}
270
271	my $ret = '';
272
273	# Prefer the relative offset (that is what we want for shared libraries), but
274	# if is not available, use the full offset (which is what we want for the
275	# base executable).
276	my $exe_off = $node->{'relpc'};
277	if (!$exe_off) {
278	$exe_off = $pc;
279	}
280
281	my $file_name = $node->{'file_name'};
282
283	# If we don't have an absolute path, this is probably the base dynamic
284	# executable, so ask the shell which one it used (not foolproof because we
285	# might not have the same PATH now, but hopefully is generally the right
286	# thing).
287	if ($file_name !~ /^\//) {
288	$file_name = `which '$file_name'`;
289	chomp($file_name);
290	}
291
292	my ($func, $loc) = `addr2line -e '$file_name' -f 0x$exe_off`;
293	chomp($func);
294	chomp($loc);
295
296	if ($func !~ /^\?/) {
297	# In general, this function name might look something like:
298	# 00000329.plt_call.wcsnrtombs@@GLIBC_2.3+0
299	$func =~ s/@.*//; # Remove trailing symbol version strings
300	$func =~ s/.*\.//;
301	$func = `c++filt '$func'`;
302	chomp($func);
303
304	# It sometimes happens that addr2line is a bit too smart: when debugging
305	# information is available, it might print a local alias for the
306	# function instead of the full name (for example, printing 'List'
307	# instead of 'Foo::List<int>::List(int, int const&)').
308	if ($node->{'proc_name'} ne '?') {
309	my $proc_name = $node->{'proc_name'};
310	$proc_name = `c++filt '$proc_name'`;
311	chomp($proc_name);
312
313	if (length($proc_name) > length($func)) {
314	$func = $proc_name;
315	}
316	}
317
318	$ret .= $func . '\n';
319
320	if ($loc !~ /^[:?]/) {
321	$ret .= $loc . '\n';
322	}
323	} elsif ($node->{'proc_name'} ne '?') {
324	my $proc_name = $node->{'proc_name'};
325	$proc_name = `c++filt '$proc_name'`;
326	chomp($proc_name);
327
328	$ret .= $proc_name . '\n';
329	}
330
331	$ret .= $node->{'file_name'};
332	if ($print_raw_proc_name and $node->{'proc_name'} ne '?') {
333	$ret .= '\n' . $node->{'proc_name'} . '+0x' . $node->{'off'};
334	}
335
336	$cached_names{$pc} = $ret;
337	return $ret;
338	}
339
340	my $skip_frac = 0.01;
341	my %skipped;
342
343	foreach my $pc (keys %all_nodes) {
344	my $node = $all_nodes{$pc};
345
346	my $local_size = $node->{'size'};
347	if ($local_size * 1.0 / $total_size < $skip_frac) {
348	$skipped{$pc} = 1;
349	next;
350	}
351
352	my $fs = 8.0;
353	if ($local_size > 0) {
354	$fs = 50.0 * (abs($local_size * 1.0 / $total_size))**0.125;
355	}
356
357	my $name = get_name($node);
358
359	printf DOT ("N%s [label=\"%s\\n%s\", shape=box, fontsize=%.1f%s];\n",
360	$pc, $name, format_bytes($local_size), $fs);
361	}
362
363	foreach my $pc (keys %all_nodes) {
364	if ($skipped{$pc}) {
365	next;
366	}
367
368	my $node = $all_nodes{$pc};
369	my $local_size = $node->{'size'};
370
371	foreach my $cpc (keys %{$node->{'child_sizes'}}) {
372	if ($skipped{$cpc}) {
373	next;
374	}
375
376	my $child_size = $node->{'child_sizes'}->{$cpc};
377	my $frac = $child_size * 1.0 / $local_size;
378
379	my $weight = 100.0 * sqrt($frac);
380	my $style = sprintf("setlinewidth(%f)", 8.0 * sqrt($frac));
381
382	my $fs = 40.0 * $frac**0.125;
383
384	printf DOT ("N%s -> N%s [label=\"%s\", weight=%d, style=\"%s\", fontsize=%.1f];\n",
385	$pc, $cpc, format_bytes($child_size), $weight, $style, $fs);
386	}
387	}
388
389	print DOT ("}\n");
390
391	foreach my $pc (sort { $all_nodes{$::b}->{'size'} <=>
392	$all_nodes{$::a}->{'size'} } keys %all_nodes) {
393	if ($skipped{$pc}) {
394	next;
395	}
396
397	print TXT ('*' x 80) . "\n\n";
398
399	my $node = $all_nodes{$pc};
400
401	my $local_size = $node->{'size'};
402	printf TXT ("%s - %.1f%%\n", format_bytes($local_size),
403	$local_size * 100.0 / $total_size);
404
405	my $name = get_name($node);
406	$name =~ s/\\n/\n/g;
407
408	print TXT "$name\n$pc\n";
409
410	print TXT "\nMEMORY ALLOCATED BY CALLEES:\n";
411
412	foreach my $cpc (sort { $node->{'child_sizes'}->{$::b} <=>
413	$node->{'child_sizes'}->{$::a} }
414	keys %{$node->{'child_sizes'}}) {
415	if ($skipped{$cpc}) {
416	next;
417	}
418
419	my $child_node = $all_nodes{$cpc};
420	my $child_size = $node->{'child_sizes'}->{$cpc};
421
422	printf TXT ("\t%s - %.1f%%\n", format_bytes($child_size),
423	$child_size * 100.0 / $local_size);
424
425	my $child_name = get_name($child_node);
426	$child_name =~ s/\\n/\n\t/g;
427	print TXT "\t$child_name\n\t$cpc\n";
428
429	print TXT "\n";
430	}
431
432	print TXT "\n";
433	}
434
435	close(TXT);
436	close(DOT);
437
438	if (!$quiet) {
439	print "Creating $ps_fn\n";
440	}
441
442	system("dot -Tps2 < '$dot_fn' > '$ps_fn'");
443
444	if (!$quiet) {
445	print "Creating $pdf_fn\n";
446	}
447
448	system("ps2pdf '$ps_fn' '$pdf_fn'");
449
450	exit 0;
451

Note: See TracBrowser for help on using the repository browser.

Download in other formats: