Context Navigation

source: memlog_analyze @ d270799

Revision d270799, 10.9 KB checked in by Hal Finkel <hfinkel@…>, 10 years ago (diff)
don't accept too many command-line parameters
Property mode set to `100755`

Rev	Line
[ebd57f8]	1	#! /usr/bin/env perl
	2	use strict;
	3	use File::Basename;
[c49b79c]	4	use Getopt::Long;
	5
[9fcaba3]	6	my $find_leaks = 0;
[c49b79c]	7	my $print_raw_proc_name = 0;
	8	my $quiet = 0;
	9	my $help = 0;
	10
	11	sub print_usage($) {
	12	my $ec = $_[0];
	13	my $usage = <<EOM;
[5df7203]	14	Usage: $0 [options] <memlog file or glob> [<output directory>]
[c49b79c]	15	options:
[9fcaba3]	16	--leaks
	17	Provide information on leaks instead of peak usage
[c49b79c]	18	--print-symbol-names
	19	Include symbol names and offsets in the output
	20	--quiet or -q
	21	Don't print status messages while running
	22	EOM
	23
	24	print $usage;
	25	exit($ec);
	26	}
	27
[3533094]	28	GetOptions("help\|h\|?" => \$help,
[9fcaba3]	29	"leaks" => \$find_leaks,
[c49b79c]	30	"print-symbol-names" => \$print_raw_proc_name,
	31	"quiet\|q" => \$quiet)
	32	or print_usage(1);
	33
	34	if ($help) {
	35	print_usage(0);
	36	}
[ebd57f8]	37
[d270799]	38	if (scalar(@ARGV) > 1) {
	39	print_usage(2);
	40	}
	41
[81dea5b]	42	my $memlog_fn = $ARGV[0];
	43	my $out_dir = $ARGV[1] \|\| '.';
	44
	45	if (! -f $memlog_fn) {
[5df7203]	46	my @pot_fns = glob($memlog_fn);
	47	if (scalar(@pot_fns)) {
	48	if (!$quiet) {
	49	print "Searching all files matching '$memlog_fn'\n";
	50	}
	51
	52	my $pot_max_rss = 0;
	53	my $pos_max_rss_fn;
	54	foreach my $pot_fn (@pot_fns) {
	55	my $last_line = `tail -n 1 '$pot_fn'`;
	56	chomp($last_line);
	57
	58	my @parts = split(/\t/, $last_line);
	59
	60	my $op = shift(@parts);
	61	my $state = shift(@parts);
	62
	63	my ($time, $then_max_rss, $tid) = split(/\s+/, $state);
	64	if ($pot_max_rss < $then_max_rss) {
	65	$pot_max_rss = $then_max_rss;
	66	$pos_max_rss_fn = $pot_fn;
	67	}
	68	}
	69
	70	if (defined $pos_max_rss_fn) {
	71	$memlog_fn = $pos_max_rss_fn;
	72	goto have_memlog_fn;
	73	}
	74	}
	75
[c49b79c]	76	print_usage(1);
[81dea5b]	77	}
[5df7203]	78	have_memlog_fn:
[81dea5b]	79
[747d2b1]	80	# The version of addr2line and friends that you use can make a big difference,
	81	# especially on BE ppc64, where older versions of addr2line did not account
	82	# correctly for the function descriptor setup. At ALCF, on the BG/Q, we have
	83	# newer versions not in the default search path (from bgclang).
	84	my $alcf_bu_dir = '/soft/compilers/bgclang/current/binutils/bin';
	85	if (-d $alcf_bu_dir) {
	86	$ENV{'PATH'} = $alcf_bu_dir . ':' . $ENV{'PATH'};
	87	}
	88
[81dea5b]	89	open(MEMLOG, $memlog_fn) \|\| die "Can't open $memlog_fn: $!";
	90
[0edbc98]	91	# The first step is to determine the high-water mark.
	92	my $max_rss = 0;
	93	foreach my $line (<MEMLOG>) {
	94	chomp($line);
	95	my @parts = split(/\t/, $line);
	96
	97	my $op = shift(@parts);
	98	my $state = shift(@parts);
	99
	100	my ($time, $then_max_rss, $tid) = split(/\s+/, $state);
	101	if ($max_rss < $then_max_rss) {
	102	$max_rss = $then_max_rss;
	103	}
	104	}
	105
	106	seek(MEMLOG, 0, 0);
	107
	108	# Scan the log for malloc/free pairings. We're interested only in active
	109	# allocations at the time when the rss reaches the final maxrss.
[9fcaba3]	110	# If we're finding leaks, then go to the very end.
	111	my $active_alloc_time = 0;
[0edbc98]	112	my %malloc_lines;
	113	foreach my $line (<MEMLOG>) {
	114	chomp($line);
	115	my @parts = split(/\t/, $line);
	116
	117	my $op = shift(@parts);
	118	my $state = shift(@parts);
	119
	120	if ($op =~ /^M:/) {
	121	my ($size, $ptr) = ($op =~ /^M: (\d+) 0x(\w+)/);
	122	$malloc_lines{$ptr} = $line;
	123	} elsif ($op =~ /^F:/) {
	124	my ($ptr) = ($op =~ /^F: 0x(\w+)/);
	125	delete $malloc_lines{$ptr};
	126	} else {
	127	next;
	128	}
	129
	130	my ($time, $then_max_rss, $tid) = split(/\s+/, $state);
[9fcaba3]	131	$active_alloc_time = $time;
	132
	133	if (!$find_leaks) {
	134	# If we've reached the max rss, we've seen all we need to see.
	135	if ($then_max_rss == $max_rss) {
	136	last;
	137	}
[0edbc98]	138	}
	139	}
	140
	141	close(MEMLOG);
	142
	143	# Convert maxrss, currently in KB, to bytes.
	144	$max_rss *= 1024;
	145
[ebd57f8]	146	my $total_size = 0;
	147	my %roots;
[c4f89cf]	148	my %all_nodes;
[0edbc98]	149	foreach my $line (values %malloc_lines) {
[ebd57f8]	150	my @parts = split(/\t/, $line);
	151
	152	my $op = shift(@parts);
	153	my $state = shift(@parts);
	154
	155	# Only dealing with allocations here...
	156	if ($op !~ /^M:/) {
	157	next;
	158	}
	159
	160	my ($size, $ptr) = ($op =~ /^M: (\d+) 0x(\w+)/);
[0edbc98]	161	my ($time, $then_max_rss, $tid) = split(/\s+/, $state);
[ebd57f8]	162
	163	$total_size += $size;
	164
	165	sub level_parts($) {
	166	my $level = @_[0];
	167	my ($file_name, $proc_name, $off, $pc, $relpc) =
	168	($level =~ /^(.) \((.)\+0x(\w+)\) \[0x(\w+) \(0x(\w+)\)\]/);
	169
	170	return ($file_name, $proc_name, $off, $pc, $relpc);
	171	}
	172
	173	# Put the top of the stack first.
	174	@parts = reverse(@parts);
	175
	176	my $parent = \%roots;
	177	for (my $i = 0; $i < scalar(@parts); ++$i) {
	178	my $level = $parts[$i];
	179	my ($file_name, $proc_name, $off, $pc, $relpc) = level_parts($level);
	180
	181	# Skip this level if we don't even know from what file it came.
	182	if ($file_name eq '?') {
	183	next;
	184	}
	185
	186	# print STDERR "parsed: $file_name, $proc_name, $off, $pc, $relpc\n";
	187
[c4f89cf]	188	if (!exists $all_nodes{$pc}) {
	189	$all_nodes{$pc}->{'file_name'} = $file_name;
	190	$all_nodes{$pc}->{'proc_name'} = $proc_name;
	191	$all_nodes{$pc}->{'off'} = $off;
	192	$all_nodes{$pc}->{'pc'} = $pc;
	193	$all_nodes{$pc}->{'relpc'} = $relpc;
	194	}
[ebd57f8]	195
[c4f89cf]	196	if (!exists $parent->{$pc}) {
	197	$parent->{$pc} = $all_nodes{$pc};
[ebd57f8]	198	}
	199
	200	$parent->{$pc}->{'size'} += $size;
	201
	202	my ($next_file_name, $next_proc_name, $next_off, $next_pc, $next_relpc);
	203	if ($i < scalar(@parts)-1) {
	204	my $next_level = $parts[$i+1];
	205	($next_file_name, $next_proc_name, $next_off, $next_pc, $next_relpc) =
	206	level_parts($next_level);
	207	$parent->{$pc}->{'child_sizes'}->{$next_pc} += $size;
	208	}
	209
	210	if (!exists $parent->{'children'}) {
	211	$parent->{'children'} = {};
	212	}
	213
	214	$parent = $parent->{'children'};
	215	}
	216	}
	217
[20b45de]	218	my $txt_fn = "$out_dir/" . basename($memlog_fn) . ".txt";
[81dea5b]	219	my $dot_fn = "$out_dir/" . basename($memlog_fn) . ".dot";
	220	my $ps_fn = "$out_dir/" . basename($memlog_fn) . ".ps";
	221	my $pdf_fn = "$out_dir/" . basename($memlog_fn) . ".pdf";
	222
[c49b79c]	223	if (!$quiet) {
	224	print "Creating $txt_fn\n";
	225	}
	226
[20b45de]	227	open(TXT, ">$txt_fn") \|\| die "Can't open $txt_fn: $!";
[c49b79c]	228
	229	if (!$quiet) {
	230	print "Creating $dot_fn\n";
	231	}
	232
[81dea5b]	233	open(DOT, ">$dot_fn") \|\| die "Can't open $dot_fn: $!";
	234
[ebd57f8]	235	sub format_bytes($) {
	236	my @sizes = qw( B KB MB GB TB PB );
	237	my $size = $_[0];
	238
	239	my $i = 0;
	240	while ($size > 1024) {
	241	$size /= 1024;
	242	++$i;
	243	}
	244
[4bd7a88]	245	return sprintf("%.3f $sizes[$i]", $size);
[ebd57f8]	246	}
	247
[bdaf020]	248	print DOT ("digraph \"memlog\" {\n");
[81dea5b]	249	print DOT ("size=\"8,11\";\n");
	250	print DOT ("node [width=0.375,height=0.25];\n");
[ebd57f8]	251
[9fcaba3]	252	my $find_type = $find_leaks ? " (leaks)" : "";
[bdaf020]	253	printf DOT ("Legend [shape=box, fontsize=100, shape=oval," .
[9fcaba3]	254	"label=\"Total: %s active$find_type at maxrss = %s after %s s\"];\n",
	255	format_bytes($total_size), format_bytes($max_rss),
	256	$active_alloc_time);
[bdaf020]	257
[9fcaba3]	258	printf TXT ("memlog: Total: %s active$find_type at maxrss = %s after %s s\n\n",
	259	format_bytes($total_size), format_bytes($max_rss),
	260	$active_alloc_time);
[20b45de]	261
[ebd57f8]	262	my %cached_names;
	263	sub get_name($) {
	264	my $node = $_[0];
	265	my $pc = $node->{'pc'};
	266
	267	if (exists $cached_names{$pc}) {
	268	return $cached_names{$pc};
	269	}
	270
	271	my $ret = '';
	272
	273	# Prefer the relative offset (that is what we want for shared libraries), but
	274	# if is not available, use the full offset (which is what we want for the
	275	# base executable).
	276	my $exe_off = $node->{'relpc'};
	277	if (!$exe_off) {
	278	$exe_off = $pc;
	279	}
	280
	281	my $file_name = $node->{'file_name'};
[518793d]	282
	283	# If we don't have an absolute path, this is probably the base dynamic
	284	# executable, so ask the shell which one it used (not foolproof because we
	285	# might not have the same PATH now, but hopefully is generally the right
	286	# thing).
	287	if ($file_name !~ /^\//) {
	288	$file_name = `which '$file_name'`;
	289	chomp($file_name);
	290	}
	291
	292	my ($func, $loc) = `addr2line -e '$file_name' -f 0x$exe_off`;
[ebd57f8]	293	chomp($func);
	294	chomp($loc);
	295
	296	if ($func !~ /^\?/) {
[6520ef5]	297	# In general, this function name might look something like:
	298	# 00000329.plt_call.wcsnrtombs@@GLIBC_2.3+0
[10599da]	299	$func =~ s/@.*//; # Remove trailing symbol version strings
[ebd57f8]	300	$func =~ s/.*\.//;
	301	$func = `c++filt '$func'`;
	302	chomp($func);
	303
[1bd82e0]	304	# It sometimes happens that addr2line is a bit too smart: when debugging
	305	# information is available, it might print a local alias for the
	306	# function instead of the full name (for example, printing 'List'
	307	# instead of 'Foo::List<int>::List(int, int const&)').
	308	if ($node->{'proc_name'} ne '?') {
	309	my $proc_name = $node->{'proc_name'};
	310	$proc_name = `c++filt '$proc_name'`;
	311	chomp($proc_name);
	312
	313	if (length($proc_name) > length($func)) {
	314	$func = $proc_name;
	315	}
	316	}
	317
[081a0fa]	318	$ret .= $func . '\n';
	319
[77ebdb8]	320	if ($loc !~ /^[:?]/) {
[081a0fa]	321	$ret .= $loc . '\n';
	322	}
[4bd7a88]	323	} elsif ($node->{'proc_name'} ne '?') {
	324	my $proc_name = $node->{'proc_name'};
	325	$proc_name = `c++filt '$proc_name'`;
	326	chomp($proc_name);
	327
	328	$ret .= $proc_name . '\n';
[ebd57f8]	329	}
	330
[6bfe6a1]	331	$ret .= $node->{'file_name'};
	332	if ($print_raw_proc_name and $node->{'proc_name'} ne '?') {
	333	$ret .= '\n' . $node->{'proc_name'} . '+0x' . $node->{'off'};
[ebd57f8]	334	}
	335
	336	$cached_names{$pc} = $ret;
	337	return $ret;
	338	}
	339
[4bd7a88]	340	my $skip_frac = 0.01;
	341	my %skipped;
	342
[c4f89cf]	343	foreach my $pc (keys %all_nodes) {
	344	my $node = $all_nodes{$pc};
[ebd57f8]	345
	346	my $local_size = $node->{'size'};
[4bd7a88]	347	if ($local_size * 1.0 / $total_size < $skip_frac) {
[c4f89cf]	348	$skipped{$pc} = 1;
[4bd7a88]	349	next;
	350	}
[ebd57f8]	351
	352	my $fs = 8.0;
	353	if ($local_size > 0) {
[4bd7a88]	354	$fs = 50.0 * (abs($local_size * 1.0 / $total_size))**0.125;
[ebd57f8]	355	}
	356
[20b45de]	357	my $name = get_name($node);
	358
[81dea5b]	359	printf DOT ("N%s [label=\"%s\\n%s\", shape=box, fontsize=%.1f%s];\n",
[c4f89cf]	360	$pc, $name, format_bytes($local_size), $fs);
[ebd57f8]	361	}
	362
[c4f89cf]	363	foreach my $pc (keys %all_nodes) {
	364	if ($skipped{$pc}) {
[4bd7a88]	365	next;
	366	}
[ebd57f8]	367
[20b45de]	368	my $node = $all_nodes{$pc};
	369	my $local_size = $node->{'size'};
	370
[ebd57f8]	371	foreach my $cpc (keys %{$node->{'child_sizes'}}) {
[4bd7a88]	372	if ($skipped{$cpc}) {
	373	next;
	374	}
	375
[ebd57f8]	376	my $child_size = $node->{'child_sizes'}->{$cpc};
	377	my $frac = $child_size * 1.0 / $local_size;
	378
[4bd7a88]	379	my $weight = 100.0 * sqrt($frac);
[6520ef5]	380	my $style = sprintf("setlinewidth(%f)", 8.0 * sqrt($frac));
[ebd57f8]	381
[6520ef5]	382	my $fs = 40.0 * $frac**0.125;
	383
[81dea5b]	384	printf DOT ("N%s -> N%s [label=\"%s\", weight=%d, style=\"%s\", fontsize=%.1f];\n",
[6520ef5]	385	$pc, $cpc, format_bytes($child_size), $weight, $style, $fs);
[ebd57f8]	386	}
	387	}
	388
[81dea5b]	389	print DOT ("}\n");
	390
[20b45de]	391	foreach my $pc (sort { $all_nodes{$::b}->{'size'} <=>
	392	$all_nodes{$::a}->{'size'} } keys %all_nodes) {
	393	if ($skipped{$pc}) {
	394	next;
	395	}
	396
	397	print TXT ('*' x 80) . "\n\n";
	398
	399	my $node = $all_nodes{$pc};
	400
	401	my $local_size = $node->{'size'};
	402	printf TXT ("%s - %.1f%%\n", format_bytes($local_size),
	403	$local_size * 100.0 / $total_size);
	404
	405	my $name = get_name($node);
	406	$name =~ s/\\n/\n/g;
	407
	408	print TXT "$name\n$pc\n";
	409
	410	print TXT "\nMEMORY ALLOCATED BY CALLEES:\n";
	411
	412	foreach my $cpc (sort { $node->{'child_sizes'}->{$::b} <=>
	413	$node->{'child_sizes'}->{$::a} }
	414	keys %{$node->{'child_sizes'}}) {
	415	if ($skipped{$cpc}) {
	416	next;
	417	}
	418
	419	my $child_node = $all_nodes{$cpc};
	420	my $child_size = $node->{'child_sizes'}->{$cpc};
	421
	422	printf TXT ("\t%s - %.1f%%\n", format_bytes($child_size),
	423	$child_size * 100.0 / $local_size);
	424
	425	my $child_name = get_name($child_node);
	426	$child_name =~ s/\\n/\n\t/g;
	427	print TXT "\t$child_name\n\t$cpc\n";
	428
	429	print TXT "\n";
	430	}
	431
	432	print TXT "\n";
	433	}
	434
	435	close(TXT);
[81dea5b]	436	close(DOT);
	437
[c49b79c]	438	if (!$quiet) {
	439	print "Creating $ps_fn\n";
	440	}
	441
[81dea5b]	442	system("dot -Tps2 < '$dot_fn' > '$ps_fn'");
[c49b79c]	443
	444	if (!$quiet) {
	445	print "Creating $pdf_fn\n";
	446	}
	447
[81dea5b]	448	system("ps2pdf '$ps_fn' '$pdf_fn'");
	449
	450	exit 0;
[ebd57f8]	451

Note: See TracBrowser for help on using the repository browser.

Download in other formats: