Linux Audio

Check our new training course

Yocto / OpenEmbedded training

Mar 24-27, 2025, special US time zones
Register
Loading...
v3.5.6
   1#!/usr/bin/perl -w
 
 
   2# (c) 2007, Joe Perches <joe@perches.com>
   3#           created from checkpatch.pl
   4#
   5# Print selected MAINTAINERS information for
   6# the files modified in a patch or for a file
   7#
   8# usage: perl scripts/get_maintainer.pl [OPTIONS] <patch>
   9#        perl scripts/get_maintainer.pl [OPTIONS] -f <file>
  10#
  11# Licensed under the terms of the GNU GPL License version 2
  12
 
  13use strict;
  14
  15my $P = $0;
  16my $V = '0.26';
  17
  18use Getopt::Long qw(:config no_auto_abbrev);
 
 
 
 
  19
 
  20my $lk_path = "./";
  21my $email = 1;
  22my $email_usename = 1;
  23my $email_maintainer = 1;
 
 
  24my $email_list = 1;
 
  25my $email_subscriber_list = 0;
  26my $email_git_penguin_chiefs = 0;
  27my $email_git = 0;
  28my $email_git_all_signature_types = 0;
  29my $email_git_blame = 0;
  30my $email_git_blame_signatures = 1;
  31my $email_git_fallback = 1;
  32my $email_git_min_signatures = 1;
  33my $email_git_max_maintainers = 5;
  34my $email_git_min_percent = 5;
  35my $email_git_since = "1-year-ago";
  36my $email_hg_since = "-365";
  37my $interactive = 0;
  38my $email_remove_duplicates = 1;
  39my $email_use_mailmap = 1;
  40my $output_multiline = 1;
  41my $output_separator = ", ";
  42my $output_roles = 0;
  43my $output_rolestats = 1;
 
  44my $scm = 0;
 
  45my $web = 0;
  46my $subsystem = 0;
  47my $status = 0;
 
  48my $keywords = 1;
 
  49my $sections = 0;
  50my $file_emails = 0;
  51my $from_filename = 0;
  52my $pattern_depth = 0;
 
  53my $version = 0;
  54my $help = 0;
  55
 
  56my $vcs_used = 0;
  57
  58my $exit = 0;
  59
 
 
 
 
 
 
  60my %commit_author_hash;
  61my %commit_signer_hash;
  62
  63my @penguin_chief = ();
  64push(@penguin_chief, "Linus Torvalds:torvalds\@linux-foundation.org");
  65#Andrew wants in on most everything - 2009/01/14
  66#push(@penguin_chief, "Andrew Morton:akpm\@linux-foundation.org");
  67
  68my @penguin_chief_names = ();
  69foreach my $chief (@penguin_chief) {
  70    if ($chief =~ m/^(.*):(.*)/) {
  71	my $chief_name = $1;
  72	my $chief_addr = $2;
  73	push(@penguin_chief_names, $chief_name);
  74    }
  75}
  76my $penguin_chiefs = "\(" . join("|", @penguin_chief_names) . "\)";
  77
  78# Signature types of people who are either
  79# 	a) responsible for the code in question, or
  80# 	b) familiar enough with it to give relevant feedback
  81my @signature_tags = ();
  82push(@signature_tags, "Signed-off-by:");
  83push(@signature_tags, "Reviewed-by:");
  84push(@signature_tags, "Acked-by:");
  85
  86my $signature_pattern = "\(" . join("|", @signature_tags) . "\)";
  87
  88# rfc822 email address - preloaded methods go here.
  89my $rfc822_lwsp = "(?:(?:\\r\\n)?[ \\t])";
  90my $rfc822_char = '[\\000-\\377]';
  91
  92# VCS command support: class-like functions and strings
  93
  94my %VCS_cmds;
  95
  96my %VCS_cmds_git = (
  97    "execute_cmd" => \&git_execute_cmd,
  98    "available" => '(which("git") ne "") && (-d ".git")',
  99    "find_signers_cmd" =>
 100	"git log --no-color --follow --since=\$email_git_since " .
 
 101	    '--format="GitCommit: %H%n' .
 102		      'GitAuthor: %an <%ae>%n' .
 103		      'GitDate: %aD%n' .
 104		      'GitSubject: %s%n' .
 105		      '%b%n"' .
 106	    " -- \$file",
 107    "find_commit_signers_cmd" =>
 108	"git log --no-color " .
 
 109	    '--format="GitCommit: %H%n' .
 110		      'GitAuthor: %an <%ae>%n' .
 111		      'GitDate: %aD%n' .
 112		      'GitSubject: %s%n' .
 113		      '%b%n"' .
 114	    " -1 \$commit",
 115    "find_commit_author_cmd" =>
 116	"git log --no-color " .
 
 117	    '--format="GitCommit: %H%n' .
 118		      'GitAuthor: %an <%ae>%n' .
 119		      'GitDate: %aD%n' .
 120		      'GitSubject: %s%n"' .
 121	    " -1 \$commit",
 122    "blame_range_cmd" => "git blame -l -L \$diff_start,+\$diff_length \$file",
 123    "blame_file_cmd" => "git blame -l \$file",
 124    "commit_pattern" => "^GitCommit: ([0-9a-f]{40,40})",
 125    "blame_commit_pattern" => "^([0-9a-f]+) ",
 126    "author_pattern" => "^GitAuthor: (.*)",
 127    "subject_pattern" => "^GitSubject: (.*)",
 
 
 
 128);
 129
 130my %VCS_cmds_hg = (
 131    "execute_cmd" => \&hg_execute_cmd,
 132    "available" => '(which("hg") ne "") && (-d ".hg")',
 133    "find_signers_cmd" =>
 134	"hg log --date=\$email_hg_since " .
 135	    "--template='HgCommit: {node}\\n" .
 136	                "HgAuthor: {author}\\n" .
 137			"HgSubject: {desc}\\n'" .
 138	    " -- \$file",
 139    "find_commit_signers_cmd" =>
 140	"hg log " .
 141	    "--template='HgSubject: {desc}\\n'" .
 142	    " -r \$commit",
 143    "find_commit_author_cmd" =>
 144	"hg log " .
 145	    "--template='HgCommit: {node}\\n" .
 146		        "HgAuthor: {author}\\n" .
 147			"HgSubject: {desc|firstline}\\n'" .
 148	    " -r \$commit",
 149    "blame_range_cmd" => "",		# not supported
 150    "blame_file_cmd" => "hg blame -n \$file",
 151    "commit_pattern" => "^HgCommit: ([0-9a-f]{40,40})",
 152    "blame_commit_pattern" => "^([ 0-9a-f]+):",
 153    "author_pattern" => "^HgAuthor: (.*)",
 154    "subject_pattern" => "^HgSubject: (.*)",
 
 
 
 155);
 156
 157my $conf = which_conf(".get_maintainer.conf");
 158if (-f $conf) {
 159    my @conf_args;
 160    open(my $conffile, '<', "$conf")
 161	or warn "$P: Can't find a readable .get_maintainer.conf file $!\n";
 162
 163    while (<$conffile>) {
 164	my $line = $_;
 165
 166	$line =~ s/\s*\n?$//g;
 167	$line =~ s/^\s*//g;
 168	$line =~ s/\s+/ /g;
 169
 170	next if ($line =~ m/^\s*#/);
 171	next if ($line =~ m/^\s*$/);
 172
 173	my @words = split(" ", $line);
 174	foreach my $word (@words) {
 175	    last if ($word =~ m/^#/);
 176	    push (@conf_args, $word);
 177	}
 178    }
 179    close($conffile);
 180    unshift(@ARGV, @conf_args) if @conf_args;
 181}
 182
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 183if (!GetOptions(
 184		'email!' => \$email,
 185		'git!' => \$email_git,
 186		'git-all-signature-types!' => \$email_git_all_signature_types,
 187		'git-blame!' => \$email_git_blame,
 188		'git-blame-signatures!' => \$email_git_blame_signatures,
 189		'git-fallback!' => \$email_git_fallback,
 190		'git-chief-penguins!' => \$email_git_penguin_chiefs,
 191		'git-min-signatures=i' => \$email_git_min_signatures,
 192		'git-max-maintainers=i' => \$email_git_max_maintainers,
 193		'git-min-percent=i' => \$email_git_min_percent,
 194		'git-since=s' => \$email_git_since,
 195		'hg-since=s' => \$email_hg_since,
 196		'i|interactive!' => \$interactive,
 197		'remove-duplicates!' => \$email_remove_duplicates,
 198		'mailmap!' => \$email_use_mailmap,
 199		'm!' => \$email_maintainer,
 
 200		'n!' => \$email_usename,
 201		'l!' => \$email_list,
 
 
 202		's!' => \$email_subscriber_list,
 203		'multiline!' => \$output_multiline,
 204		'roles!' => \$output_roles,
 205		'rolestats!' => \$output_rolestats,
 206		'separator=s' => \$output_separator,
 207		'subsystem!' => \$subsystem,
 208		'status!' => \$status,
 209		'scm!' => \$scm,
 
 210		'web!' => \$web,
 
 211		'pattern-depth=i' => \$pattern_depth,
 212		'k|keywords!' => \$keywords,
 
 213		'sections!' => \$sections,
 214		'fe|file-emails!' => \$file_emails,
 215		'f|file' => \$from_filename,
 
 
 
 216		'v|version' => \$version,
 217		'h|help|usage' => \$help,
 218		)) {
 219    die "$P: invalid argument - use --help if necessary\n";
 220}
 221
 222if ($help != 0) {
 223    usage();
 224    exit 0;
 225}
 226
 227if ($version != 0) {
 228    print("${P} ${V}\n");
 229    exit 0;
 230}
 231
 
 
 
 
 
 
 232if (-t STDIN && !@ARGV) {
 233    # We're talking to a terminal, but have no command line arguments.
 234    die "$P: missing patchfile or -f file - use --help if necessary\n";
 235}
 236
 237$output_multiline = 0 if ($output_separator ne ", ");
 238$output_rolestats = 1 if ($interactive);
 239$output_roles = 1 if ($output_rolestats);
 240
 241if ($sections) {
 
 242    $email = 0;
 243    $email_list = 0;
 244    $scm = 0;
 245    $status = 0;
 246    $subsystem = 0;
 247    $web = 0;
 248    $keywords = 0;
 
 249    $interactive = 0;
 250} else {
 251    my $selections = $email + $scm + $status + $subsystem + $web;
 252    if ($selections == 0) {
 253	die "$P:  Missing required option: email, scm, status, subsystem or web\n";
 254    }
 255}
 256
 257if ($email &&
 258    ($email_maintainer + $email_list + $email_subscriber_list +
 
 259     $email_git + $email_git_penguin_chiefs + $email_git_blame) == 0) {
 260    die "$P: Please select at least 1 email option\n";
 261}
 262
 263if (!top_of_kernel_tree($lk_path)) {
 264    die "$P: The current directory does not appear to be "
 265	. "a linux kernel source tree.\n";
 266}
 267
 268## Read MAINTAINERS for type/value pairs
 269
 270my @typevalue = ();
 271my %keyword_hash;
 
 
 272
 273open (my $maint, '<', "${lk_path}MAINTAINERS")
 274    or die "$P: Can't open MAINTAINERS: $!\n";
 275while (<$maint>) {
 276    my $line = $_;
 277
 278    if ($line =~ m/^(\C):\s*(.*)/) {
 279	my $type = $1;
 280	my $value = $2;
 
 
 
 281
 282	##Filename pattern matching
 283	if ($type eq "F" || $type eq "X") {
 284	    $value =~ s@\.@\\\.@g;       ##Convert . to \.
 285	    $value =~ s/\*/\.\*/g;       ##Convert * to .*
 286	    $value =~ s/\?/\./g;         ##Convert ? to .
 287	    ##if pattern is a directory and it lacks a trailing slash, add one
 288	    if ((-d $value)) {
 289		$value =~ s@([^/])$@$1/@;
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 290	    }
 291	} elsif ($type eq "K") {
 292	    $keyword_hash{@typevalue} = $value;
 293	}
 294	push(@typevalue, "$type:$value");
 295    } elsif (!/^(\s)*$/) {
 296	$line =~ s/\n$//g;
 297	push(@typevalue, $line);
 
 
 
 
 298    }
 299}
 300close($maint);
 301
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 302
 303#
 304# Read mail address map
 305#
 306
 307my $mailmap;
 308
 309read_mailmap();
 310
 311sub read_mailmap {
 312    $mailmap = {
 313	names => {},
 314	addresses => {}
 315    };
 316
 317    return if (!$email_use_mailmap || !(-f "${lk_path}.mailmap"));
 318
 319    open(my $mailmap_file, '<', "${lk_path}.mailmap")
 320	or warn "$P: Can't open .mailmap: $!\n";
 321
 322    while (<$mailmap_file>) {
 323	s/#.*$//; #strip comments
 324	s/^\s+|\s+$//g; #trim
 325
 326	next if (/^\s*$/); #skip empty lines
 327	#entries have one of the following formats:
 328	# name1 <mail1>
 329	# <mail1> <mail2>
 330	# name1 <mail1> <mail2>
 331	# name1 <mail1> name2 <mail2>
 332	# (see man git-shortlog)
 333
 334	if (/^([^<]+)<([^>]+)>$/) {
 335	    my $real_name = $1;
 336	    my $address = $2;
 337
 338	    $real_name =~ s/\s+$//;
 339	    ($real_name, $address) = parse_email("$real_name <$address>");
 340	    $mailmap->{names}->{$address} = $real_name;
 341
 342	} elsif (/^<([^>]+)>\s*<([^>]+)>$/) {
 343	    my $real_address = $1;
 344	    my $wrong_address = $2;
 345
 346	    $mailmap->{addresses}->{$wrong_address} = $real_address;
 347
 348	} elsif (/^(.+)<([^>]+)>\s*<([^>]+)>$/) {
 349	    my $real_name = $1;
 350	    my $real_address = $2;
 351	    my $wrong_address = $3;
 352
 353	    $real_name =~ s/\s+$//;
 354	    ($real_name, $real_address) =
 355		parse_email("$real_name <$real_address>");
 356	    $mailmap->{names}->{$wrong_address} = $real_name;
 357	    $mailmap->{addresses}->{$wrong_address} = $real_address;
 358
 359	} elsif (/^(.+)<([^>]+)>\s*(.+)\s*<([^>]+)>$/) {
 360	    my $real_name = $1;
 361	    my $real_address = $2;
 362	    my $wrong_name = $3;
 363	    my $wrong_address = $4;
 364
 365	    $real_name =~ s/\s+$//;
 366	    ($real_name, $real_address) =
 367		parse_email("$real_name <$real_address>");
 368
 369	    $wrong_name =~ s/\s+$//;
 370	    ($wrong_name, $wrong_address) =
 371		parse_email("$wrong_name <$wrong_address>");
 372
 373	    my $wrong_email = format_email($wrong_name, $wrong_address, 1);
 374	    $mailmap->{names}->{$wrong_email} = $real_name;
 375	    $mailmap->{addresses}->{$wrong_email} = $real_address;
 376	}
 377    }
 378    close($mailmap_file);
 379}
 380
 381## use the filenames on the command line or find the filenames in the patchfiles
 382
 383my @files = ();
 384my @range = ();
 385my @keyword_tvi = ();
 386my @file_emails = ();
 387
 388if (!@ARGV) {
 389    push(@ARGV, "&STDIN");
 390}
 391
 392foreach my $file (@ARGV) {
 393    if ($file ne "&STDIN") {
 
 394	##if $file is a directory and it lacks a trailing slash, add one
 395	if ((-d $file)) {
 396	    $file =~ s@([^/])$@$1/@;
 397	} elsif (!(-f $file)) {
 398	    die "$P: file '${file}' not found\n";
 399	}
 400    }
 401    if ($from_filename) {
 
 
 
 
 
 402	push(@files, $file);
 403	if ($file ne "MAINTAINERS" && -f $file && ($keywords || $file_emails)) {
 404	    open(my $f, '<', $file)
 405		or die "$P: Can't open $file: $!\n";
 406	    my $text = do { local($/) ; <$f> };
 407	    close($f);
 408	    if ($keywords) {
 409		foreach my $line (keys %keyword_hash) {
 410		    if ($text =~ m/$keyword_hash{$line}/x) {
 411			push(@keyword_tvi, $line);
 412		    }
 413		}
 414	    }
 415	    if ($file_emails) {
 416		my @poss_addr = $text =~ m$[A-Za-zÀ-ÿ\"\' \,\.\+-]*\s*[\,]*\s*[\(\<\{]{0,1}[A-Za-z0-9_\.\+-]+\@[A-Za-z0-9\.-]+\.[A-Za-z0-9]+[\)\>\}]{0,1}$g;
 417		push(@file_emails, clean_file_emails(@poss_addr));
 418	    }
 419	}
 420    } else {
 421	my $file_cnt = @files;
 422	my $lastfile;
 423
 424	open(my $patch, "< $file")
 425	    or die "$P: Can't open $file: $!\n";
 426
 427	# We can check arbitrary information before the patch
 428	# like the commit message, mail headers, etc...
 429	# This allows us to match arbitrary keywords against any part
 430	# of a git format-patch generated file (subject tags, etc...)
 431
 432	my $patch_prefix = "";			#Parsing the intro
 433
 434	while (<$patch>) {
 435	    my $patch_line = $_;
 436	    if (m/^\+\+\+\s+(\S+)/) {
 
 
 
 
 
 
 
 
 
 
 
 
 
 437		my $filename = $1;
 438		$filename =~ s@^[^/]*/@@;
 439		$filename =~ s@\n@@;
 440		$lastfile = $filename;
 441		push(@files, $filename);
 442		$patch_prefix = "^[+-].*";	#Now parsing the actual patch
 443	    } elsif (m/^\@\@ -(\d+),(\d+)/) {
 444		if ($email_git_blame) {
 445		    push(@range, "$lastfile:$1:$2");
 446		}
 447	    } elsif ($keywords) {
 448		foreach my $line (keys %keyword_hash) {
 449		    if ($patch_line =~ m/${patch_prefix}$keyword_hash{$line}/x) {
 450			push(@keyword_tvi, $line);
 451		    }
 452		}
 453	    }
 454	}
 455	close($patch);
 456
 457	if ($file_cnt == @files) {
 458	    warn "$P: file '${file}' doesn't appear to be a patch.  "
 459		. "Add -f to options?\n";
 460	}
 461	@files = sort_and_uniq(@files);
 462    }
 463}
 464
 465@file_emails = uniq(@file_emails);
 
 466
 467my %email_hash_name;
 468my %email_hash_address;
 469my @email_to = ();
 470my %hash_list_to;
 471my @list_to = ();
 472my @scm = ();
 473my @web = ();
 474my @subsystem = ();
 475my @status = ();
 476my %deduplicate_name_hash = ();
 477my %deduplicate_address_hash = ();
 478
 479my @maintainers = get_maintainers();
 480
 481if (@maintainers) {
 482    @maintainers = merge_email(@maintainers);
 483    output(@maintainers);
 484}
 485
 486if ($scm) {
 487    @scm = uniq(@scm);
 488    output(@scm);
 489}
 490
 491if ($status) {
 492    @status = uniq(@status);
 493    output(@status);
 494}
 495
 496if ($subsystem) {
 497    @subsystem = uniq(@subsystem);
 498    output(@subsystem);
 499}
 500
 501if ($web) {
 502    @web = uniq(@web);
 503    output(@web);
 504}
 505
 506exit($exit);
 507
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 508sub range_is_maintained {
 509    my ($start, $end) = @_;
 510
 511    for (my $i = $start; $i < $end; $i++) {
 512	my $line = $typevalue[$i];
 513	if ($line =~ m/^(\C):\s*(.*)/) {
 514	    my $type = $1;
 515	    my $value = $2;
 516	    if ($type eq 'S') {
 517		if ($value =~ /(maintain|support)/i) {
 518		    return 1;
 519		}
 520	    }
 521	}
 522    }
 523    return 0;
 524}
 525
 526sub range_has_maintainer {
 527    my ($start, $end) = @_;
 528
 529    for (my $i = $start; $i < $end; $i++) {
 530	my $line = $typevalue[$i];
 531	if ($line =~ m/^(\C):\s*(.*)/) {
 532	    my $type = $1;
 533	    my $value = $2;
 534	    if ($type eq 'M') {
 535		return 1;
 536	    }
 537	}
 538    }
 539    return 0;
 540}
 541
 542sub get_maintainers {
 543    %email_hash_name = ();
 544    %email_hash_address = ();
 545    %commit_author_hash = ();
 546    %commit_signer_hash = ();
 547    @email_to = ();
 548    %hash_list_to = ();
 549    @list_to = ();
 550    @scm = ();
 551    @web = ();
 552    @subsystem = ();
 553    @status = ();
 554    %deduplicate_name_hash = ();
 555    %deduplicate_address_hash = ();
 556    if ($email_git_all_signature_types) {
 557	$signature_pattern = "(.+?)[Bb][Yy]:";
 558    } else {
 559	$signature_pattern = "\(" . join("|", @signature_tags) . "\)";
 560    }
 561
 562    # Find responsible parties
 563
 564    my %exact_pattern_match_hash = ();
 565
 566    foreach my $file (@files) {
 567
 568	my %hash;
 569	my $tvi = find_first_section();
 570	while ($tvi < @typevalue) {
 571	    my $start = find_starting_index($tvi);
 572	    my $end = find_ending_index($tvi);
 573	    my $exclude = 0;
 574	    my $i;
 575
 576	    #Do not match excluded file patterns
 577
 578	    for ($i = $start; $i < $end; $i++) {
 579		my $line = $typevalue[$i];
 580		if ($line =~ m/^(\C):\s*(.*)/) {
 581		    my $type = $1;
 582		    my $value = $2;
 583		    if ($type eq 'X') {
 584			if (file_match_pattern($file, $value)) {
 585			    $exclude = 1;
 586			    last;
 587			}
 588		    }
 589		}
 590	    }
 591
 592	    if (!$exclude) {
 593		for ($i = $start; $i < $end; $i++) {
 594		    my $line = $typevalue[$i];
 595		    if ($line =~ m/^(\C):\s*(.*)/) {
 596			my $type = $1;
 597			my $value = $2;
 598			if ($type eq 'F') {
 599			    if (file_match_pattern($file, $value)) {
 600				my $value_pd = ($value =~ tr@/@@);
 601				my $file_pd = ($file  =~ tr@/@@);
 602				$value_pd++ if (substr($value,-1,1) ne "/");
 603				$value_pd = -1 if ($value =~ /^\.\*/);
 604				if ($value_pd >= $file_pd &&
 605				    range_is_maintained($start, $end) &&
 606				    range_has_maintainer($start, $end)) {
 607				    $exact_pattern_match_hash{$file} = 1;
 608				}
 609				if ($pattern_depth == 0 ||
 610				    (($file_pd - $value_pd) < $pattern_depth)) {
 611				    $hash{$tvi} = $value_pd;
 612				}
 613			    }
 
 
 
 
 614			}
 615		    }
 616		}
 617	    }
 618	    $tvi = $end + 1;
 619	}
 620
 621	foreach my $line (sort {$hash{$b} <=> $hash{$a}} keys %hash) {
 622	    add_categories($line);
 623	    if ($sections) {
 624		my $i;
 625		my $start = find_starting_index($line);
 626		my $end = find_ending_index($line);
 627		for ($i = $start; $i < $end; $i++) {
 628		    my $line = $typevalue[$i];
 629		    if ($line =~ /^[FX]:/) {		##Restore file patterns
 630			$line =~ s/([^\\])\.([^\*])/$1\?$2/g;
 631			$line =~ s/([^\\])\.$/$1\?/g;	##Convert . back to ?
 632			$line =~ s/\\\./\./g;       	##Convert \. to .
 633			$line =~ s/\.\*/\*/g;       	##Convert .* to *
 634		    }
 635		    $line =~ s/^([A-Z]):/$1:\t/g;
 636		    print("$line\n");
 
 
 637		}
 638		print("\n");
 639	    }
 640	}
 
 
 641    }
 642
 643    if ($keywords) {
 644	@keyword_tvi = sort_and_uniq(@keyword_tvi);
 645	foreach my $line (@keyword_tvi) {
 646	    add_categories($line);
 647	}
 648    }
 649
 650    foreach my $email (@email_to, @list_to) {
 651	$email->[0] = deduplicate_email($email->[0]);
 652    }
 653
 654    foreach my $file (@files) {
 655	if ($email &&
 656	    ($email_git || ($email_git_fallback &&
 657			    !$exact_pattern_match_hash{$file}))) {
 
 
 658	    vcs_file_signoffs($file);
 659	}
 660	if ($email && $email_git_blame) {
 661	    vcs_file_blame($file);
 662	}
 663    }
 664
 665    if ($email) {
 666	foreach my $chief (@penguin_chief) {
 667	    if ($chief =~ m/^(.*):(.*)/) {
 668		my $email_address;
 669
 670		$email_address = format_email($1, $2, $email_usename);
 671		if ($email_git_penguin_chiefs) {
 672		    push(@email_to, [$email_address, 'chief penguin']);
 673		} else {
 674		    @email_to = grep($_->[0] !~ /${email_address}/, @email_to);
 675		}
 676	    }
 677	}
 678
 679	foreach my $email (@file_emails) {
 
 680	    my ($name, $address) = parse_email($email);
 681
 682	    my $tmp_email = format_email($name, $address, $email_usename);
 683	    push_email_address($tmp_email, '');
 684	    add_role($tmp_email, 'in file');
 685	}
 686    }
 687
 
 
 
 
 688    my @to = ();
 689    if ($email || $email_list) {
 690	if ($email) {
 691	    @to = (@to, @email_to);
 692	}
 693	if ($email_list) {
 694	    @to = (@to, @list_to);
 695	}
 696    }
 697
 698    if ($interactive) {
 699	@to = interactive_get_maintainers(\@to);
 700    }
 701
 702    return @to;
 703}
 704
 705sub file_match_pattern {
 706    my ($file, $pattern) = @_;
 707    if (substr($pattern, -1) eq "/") {
 708	if ($file =~ m@^$pattern@) {
 709	    return 1;
 710	}
 711    } else {
 712	if ($file =~ m@^$pattern@) {
 713	    my $s1 = ($file =~ tr@/@@);
 714	    my $s2 = ($pattern =~ tr@/@@);
 715	    if ($s1 == $s2) {
 716		return 1;
 717	    }
 718	}
 719    }
 720    return 0;
 721}
 722
 723sub usage {
 724    print <<EOT;
 725usage: $P [options] patchfile
 726       $P [options] -f file|directory
 727version: $V
 728
 729MAINTAINER field selection options:
 730  --email => print email address(es) if any
 731    --git => include recent git \*-by: signers
 732    --git-all-signature-types => include signers regardless of signature type
 733        or use only ${signature_pattern} signers (default: $email_git_all_signature_types)
 734    --git-fallback => use git when no exact MAINTAINERS pattern (default: $email_git_fallback)
 735    --git-chief-penguins => include ${penguin_chiefs}
 736    --git-min-signatures => number of signatures required (default: $email_git_min_signatures)
 737    --git-max-maintainers => maximum maintainers to add (default: $email_git_max_maintainers)
 738    --git-min-percent => minimum percentage of commits required (default: $email_git_min_percent)
 739    --git-blame => use git blame to find modified commits for patch or file
 
 740    --git-since => git history to use (default: $email_git_since)
 741    --hg-since => hg history to use (default: $email_hg_since)
 742    --interactive => display a menu (mostly useful if used with the --git option)
 743    --m => include maintainer(s) if any
 
 744    --n => include name 'Full Name <addr\@domain.tld>'
 745    --l => include list(s) if any
 746    --s => include subscriber only list(s) if any
 
 747    --remove-duplicates => minimize duplicate email names/addresses
 748    --roles => show roles (status:subsystem, git-signer, list, etc...)
 749    --rolestats => show roles and statistics (commits/total_commits, %)
 750    --file-emails => add email addresses found in -f file (default: 0 (off))
 
 751  --scm => print SCM tree(s) if any
 752  --status => print status if any
 753  --subsystem => print subsystem name if any
 754  --web => print website(s) if any
 755
 756Output type options:
 757  --separator [, ] => separator for multiple entries on 1 line
 758    using --separator also sets --nomultiline if --separator is not [, ]
 759  --multiline => print 1 entry per line
 760
 761Other options:
 762  --pattern-depth => Number of pattern directory traversals (default: 0 (all))
 763  --keywords => scan patch for keywords (default: $keywords)
 
 764  --sections => print all of the subsystem sections with pattern matches
 
 765  --mailmap => use .mailmap file (default: $email_use_mailmap)
 
 
 766  --version => show version
 767  --help => show this help information
 768
 769Default options:
 770  [--email --nogit --git-fallback --m --n --l --multiline -pattern-depth=0
 771   --remove-duplicates --rolestats]
 772
 773Notes:
 774  Using "-f directory" may give unexpected results:
 775      Used with "--git", git signators for _all_ files in and below
 776          directory are examined as git recurses directories.
 777          Any specified X: (exclude) pattern matches are _not_ ignored.
 778      Used with "--nogit", directory is used as a pattern match,
 779          no individual file within the directory or subdirectory
 780          is matched.
 781      Used with "--git-blame", does not iterate all files in directory
 782  Using "--git-blame" is slow and may add old committers and authors
 783      that are no longer active maintainers to the output.
 784  Using "--roles" or "--rolestats" with git send-email --cc-cmd or any
 785      other automated tools that expect only ["name"] <email address>
 786      may not work because of additional output after <email address>.
 787  Using "--rolestats" and "--git-blame" shows the #/total=% commits,
 788      not the percentage of the entire file authored.  # of commits is
 789      not a good measure of amount of code authored.  1 major commit may
 790      contain a thousand lines, 5 trivial commits may modify a single line.
 791  If git is not installed, but mercurial (hg) is installed and an .hg
 792      repository exists, the following options apply to mercurial:
 793          --git,
 794          --git-min-signatures, --git-max-maintainers, --git-min-percent, and
 795          --git-blame
 796      Use --hg-since not --git-since to control date selection
 797  File ".get_maintainer.conf", if it exists in the linux kernel source root
 798      directory, can change whatever get_maintainer defaults are desired.
 799      Entries in this file can be any command line argument.
 800      This file is prepended to any additional command line arguments.
 801      Multiple lines and # comments are allowed.
 
 
 
 802EOT
 803}
 804
 805sub top_of_kernel_tree {
 806    my ($lk_path) = @_;
 807
 808    if ($lk_path ne "" && substr($lk_path,length($lk_path)-1,1) ne "/") {
 809	$lk_path .= "/";
 810    }
 811    if (   (-f "${lk_path}COPYING")
 812	&& (-f "${lk_path}CREDITS")
 813	&& (-f "${lk_path}Kbuild")
 814	&& (-f "${lk_path}MAINTAINERS")
 815	&& (-f "${lk_path}Makefile")
 816	&& (-f "${lk_path}README")
 817	&& (-d "${lk_path}Documentation")
 818	&& (-d "${lk_path}arch")
 819	&& (-d "${lk_path}include")
 820	&& (-d "${lk_path}drivers")
 821	&& (-d "${lk_path}fs")
 822	&& (-d "${lk_path}init")
 823	&& (-d "${lk_path}ipc")
 824	&& (-d "${lk_path}kernel")
 825	&& (-d "${lk_path}lib")
 826	&& (-d "${lk_path}scripts")) {
 827	return 1;
 828    }
 829    return 0;
 830}
 831
 
 
 
 
 
 
 
 
 
 
 
 832sub parse_email {
 833    my ($formatted_email) = @_;
 834
 835    my $name = "";
 836    my $address = "";
 837
 838    if ($formatted_email =~ /^([^<]+)<(.+\@.*)>.*$/) {
 839	$name = $1;
 840	$address = $2;
 841    } elsif ($formatted_email =~ /^\s*<(.+\@\S*)>.*$/) {
 842	$address = $1;
 843    } elsif ($formatted_email =~ /^(.+\@\S*).*$/) {
 844	$address = $1;
 845    }
 846
 847    $name =~ s/^\s+|\s+$//g;
 848    $name =~ s/^\"|\"$//g;
 
 849    $address =~ s/^\s+|\s+$//g;
 850
 851    if ($name =~ /[^\w \-]/i) {  	 ##has "must quote" chars
 852	$name =~ s/(?<!\\)"/\\"/g;       ##escape quotes
 853	$name = "\"$name\"";
 854    }
 855
 856    return ($name, $address);
 857}
 858
 859sub format_email {
 860    my ($name, $address, $usename) = @_;
 861
 862    my $formatted_email;
 863
 864    $name =~ s/^\s+|\s+$//g;
 865    $name =~ s/^\"|\"$//g;
 
 866    $address =~ s/^\s+|\s+$//g;
 867
 868    if ($name =~ /[^\w \-]/i) {          ##has "must quote" chars
 869	$name =~ s/(?<!\\)"/\\"/g;       ##escape quotes
 870	$name = "\"$name\"";
 871    }
 872
 873    if ($usename) {
 874	if ("$name" eq "") {
 875	    $formatted_email = "$address";
 876	} else {
 877	    $formatted_email = "$name <$address>";
 878	}
 879    } else {
 880	$formatted_email = $address;
 881    }
 882
 883    return $formatted_email;
 884}
 885
 886sub find_first_section {
 887    my $index = 0;
 888
 889    while ($index < @typevalue) {
 890	my $tv = $typevalue[$index];
 891	if (($tv =~ m/^(\C):\s*(.*)/)) {
 892	    last;
 893	}
 894	$index++;
 895    }
 896
 897    return $index;
 898}
 899
 900sub find_starting_index {
 901    my ($index) = @_;
 902
 903    while ($index > 0) {
 904	my $tv = $typevalue[$index];
 905	if (!($tv =~ m/^(\C):\s*(.*)/)) {
 906	    last;
 907	}
 908	$index--;
 909    }
 910
 911    return $index;
 912}
 913
 914sub find_ending_index {
 915    my ($index) = @_;
 916
 917    while ($index < @typevalue) {
 918	my $tv = $typevalue[$index];
 919	if (!($tv =~ m/^(\C):\s*(.*)/)) {
 920	    last;
 921	}
 922	$index++;
 923    }
 924
 925    return $index;
 926}
 927
 928sub get_maintainer_role {
 929    my ($index) = @_;
 930
 931    my $i;
 932    my $start = find_starting_index($index);
 933    my $end = find_ending_index($index);
 934
 935    my $role = "unknown";
 936    my $subsystem = $typevalue[$start];
 937    if (length($subsystem) > 20) {
 938	$subsystem = substr($subsystem, 0, 17);
 939	$subsystem =~ s/\s*$//;
 940	$subsystem = $subsystem . "...";
 941    }
 
 
 
 
 
 
 
 
 
 
 
 
 942
 943    for ($i = $start + 1; $i < $end; $i++) {
 944	my $tv = $typevalue[$i];
 945	if ($tv =~ m/^(\C):\s*(.*)/) {
 946	    my $ptype = $1;
 947	    my $pvalue = $2;
 948	    if ($ptype eq "S") {
 949		$role = $pvalue;
 950	    }
 951	}
 952    }
 953
 954    $role = lc($role);
 955    if      ($role eq "supported") {
 956	$role = "supporter";
 957    } elsif ($role eq "maintained") {
 958	$role = "maintainer";
 959    } elsif ($role eq "odd fixes") {
 960	$role = "odd fixer";
 961    } elsif ($role eq "orphan") {
 962	$role = "orphan minder";
 963    } elsif ($role eq "obsolete") {
 964	$role = "obsolete minder";
 965    } elsif ($role eq "buried alive in reporters") {
 966	$role = "chief penguin";
 967    }
 968
 969    return $role . ":" . $subsystem;
 970}
 971
 972sub get_list_role {
 973    my ($index) = @_;
 974
 975    my $i;
 976    my $start = find_starting_index($index);
 977    my $end = find_ending_index($index);
 978
 979    my $subsystem = $typevalue[$start];
 980    if (length($subsystem) > 20) {
 981	$subsystem = substr($subsystem, 0, 17);
 982	$subsystem =~ s/\s*$//;
 983	$subsystem = $subsystem . "...";
 984    }
 985
 986    if ($subsystem eq "THE REST") {
 987	$subsystem = "";
 988    }
 989
 990    return $subsystem;
 991}
 992
 993sub add_categories {
 994    my ($index) = @_;
 995
 996    my $i;
 997    my $start = find_starting_index($index);
 998    my $end = find_ending_index($index);
 999
1000    push(@subsystem, $typevalue[$start]);
1001
1002    for ($i = $start + 1; $i < $end; $i++) {
1003	my $tv = $typevalue[$i];
1004	if ($tv =~ m/^(\C):\s*(.*)/) {
1005	    my $ptype = $1;
1006	    my $pvalue = $2;
1007	    if ($ptype eq "L") {
1008		my $list_address = $pvalue;
1009		my $list_additional = "";
1010		my $list_role = get_list_role($i);
1011
1012		if ($list_role ne "") {
1013		    $list_role = ":" . $list_role;
1014		}
1015		if ($list_address =~ m/([^\s]+)\s+(.*)$/) {
1016		    $list_address = $1;
1017		    $list_additional = $2;
1018		}
1019		if ($list_additional =~ m/subscribers-only/) {
1020		    if ($email_subscriber_list) {
1021			if (!$hash_list_to{lc($list_address)}) {
1022			    $hash_list_to{lc($list_address)} = 1;
1023			    push(@list_to, [$list_address,
1024					    "subscriber list${list_role}"]);
1025			}
1026		    }
1027		} else {
1028		    if ($email_list) {
1029			if (!$hash_list_to{lc($list_address)}) {
1030			    $hash_list_to{lc($list_address)} = 1;
1031			    if ($list_additional =~ m/moderated/) {
1032				push(@list_to, [$list_address,
1033						"moderated list${list_role}"]);
 
 
 
1034			    } else {
 
1035				push(@list_to, [$list_address,
1036						"open list${list_role}"]);
1037			    }
1038			}
1039		    }
1040		}
1041	    } elsif ($ptype eq "M") {
1042		my ($name, $address) = parse_email($pvalue);
1043		if ($name eq "") {
1044		    if ($i > 0) {
1045			my $tv = $typevalue[$i - 1];
1046			if ($tv =~ m/^(\C):\s*(.*)/) {
1047			    if ($1 eq "P") {
1048				$name = $2;
1049				$pvalue = format_email($name, $address, $email_usename);
1050			    }
1051			}
1052		    }
1053		}
1054		if ($email_maintainer) {
1055		    my $role = get_maintainer_role($i);
1056		    push_email_addresses($pvalue, $role);
 
 
 
 
 
1057		}
1058	    } elsif ($ptype eq "T") {
1059		push(@scm, $pvalue);
1060	    } elsif ($ptype eq "W") {
1061		push(@web, $pvalue);
1062	    } elsif ($ptype eq "S") {
1063		push(@status, $pvalue);
1064	    }
1065	}
1066    }
1067}
1068
# Tell whether a name/address pair is already recorded in
# %email_hash_name or %email_hash_address (both keyed on the lower-cased
# value).  A pair whose name and address are both empty counts as in use.
# Returns 1 when in use, 0 otherwise.
sub email_inuse {
    my ($name, $address) = @_;

    if ($name eq "" && $address eq "") {
	return 1;
    }
    if ($name ne "" && exists($email_hash_name{lc($name)})) {
	return 1;
    }
    if ($address ne "" && exists($email_hash_address{lc($address)})) {
	return 1;
    }

    return 0;
}
1078
# Append one address, paired with $role, to @email_to.
#
# $line is parsed with parse_email().  Returns 0 when it yields no
# address, 1 otherwise.  With $email_remove_duplicates set, an identity
# that email_inuse() already knows is not appended again (the call still
# returns 1), and every appended identity is recorded in %email_hash_name
# and %email_hash_address.
sub push_email_address {
    my ($line, $role) = @_;

    my ($name, $address) = parse_email($line);

    return 0 if ($address eq "");

    if ($email_remove_duplicates && email_inuse($name, $address)) {
	return 1;
    }

    push(@email_to, [format_email($name, $address, $email_usename), $role]);

    if ($email_remove_duplicates) {
	$email_hash_name{lc($name)}++ if ($name ne "");
	$email_hash_address{lc($address)}++;
    }

    return 1;
}
1098
# Add the address(es) found in $address to @email_to with role $role.
#
# A single RFC822 address is added as is.  Otherwise the value is tried
# as an RFC822 address list and each member is added.  As a last resort
# the raw value is handed to push_email_address(); a warning is printed
# when that fails as well.
sub push_email_addresses {
    my ($address, $role) = @_;

    my @members = ();

    if (rfc822_valid($address)) {
	push_email_address($address, $role);
    } elsif (@members = rfc822_validlist($address)) {
	# the first element is the number of addresses, not an address
	shift(@members);
	foreach my $member (@members) {
	    push_email_address($member, $role);
	}
    } else {
	warn("Invalid MAINTAINERS address: '" . $address . "'\n")
	    if (!push_email_address($address, $role));
    }
}
1117
# Attach $role to every entry of @email_to that refers to the person in
# $line.
#
# With $email_remove_duplicates set, an entry refers to the same person
# when either the name or the address is equal; otherwise the formatted
# email must be identical.  A role the entry already carries is not added
# twice; additional roles are appended comma-separated.
sub add_role {
    my ($line, $role) = @_;

    my ($name, $address) = parse_email($line);
    my $email = format_email($name, $address, $email_usename);

    foreach my $entry (@email_to) {
	my $same_person;
	if ($email_remove_duplicates) {
	    my ($entry_name, $entry_address) = parse_email($entry->[0]);
	    $same_person = ($name eq $entry_name || $address eq $entry_address);
	} else {
	    $same_person = ($email eq $entry->[0]);
	}
	next if (!$same_person);

	# Literal substring test.  Roles contain section names such as
	# "FOO (BAR..." or "NET [GENERAL]"; used as a regex these either
	# fail to match themselves or abort with "Unmatched (".
	next if ($role ne "" && index($entry->[1], $role) >= 0);

	if ($entry->[1] eq "") {
	    $entry->[1] = "$role";
	} else {
	    $entry->[1] = "$entry->[1],$role";
	}
    }
}
1149
# Look $bin up in the directories of $ENV{PATH}, in order.
# Returns "<dir>/$bin" for the first directory holding such an entry, or
# "" when there is none.  Only existence is tested.
sub which {
    my ($bin) = @_;

    my @dirs = split(/:/, $ENV{PATH});
    foreach my $dir (@dirs) {
	my $candidate = "$dir/$bin";
	return $candidate if (-e $candidate);
    }

    return "";
}
1161
# Look the configuration file $conf up in ".", $ENV{HOME} and ".scripts",
# in that order.  Returns "<dir>/$conf" for the first hit, "" otherwise.
sub which_conf {
    my ($conf) = @_;

    my @dirs = split(/:/, ".:$ENV{HOME}:.scripts");
    foreach my $dir (@dirs) {
	my $candidate = "$dir/$conf";
	return $candidate if (-e $candidate);
    }

    return "";
}
1173
# Translate one email line through the $mailmap tables.
#
# The tables $mailmap->{names} and $mailmap->{addresses} are consulted
# with the complete "Name <address>" form when either table has such a
# key, and with the bare address otherwise.  Parts without a mapping are
# kept.  Returns the result formatted as "Name <address>".
sub mailmap_email {
    my ($line) = @_;

    my ($name, $address) = parse_email($line);
    my $email = format_email($name, $address, 1);

    my $key = $address;
    if (exists $mailmap->{names}->{$email} ||
	exists $mailmap->{addresses}->{$email}) {
	$key = $email;
    }

    my $real_name = $name;
    $real_name = $mailmap->{names}->{$key}
	if (exists $mailmap->{names}->{$key});

    my $real_address = $address;
    $real_address = $mailmap->{addresses}->{$key}
	if (exists $mailmap->{addresses}->{$key});

    return format_email($real_name, $real_address, 1);
}
1200
# Run every given address through mailmap_email() and return the mapped
# list.  merge_by_realname() is called on the result when
# $email_use_mailmap is set.
sub mailmap {
    my (@addresses) = @_;

    my @mapped_emails = map { mailmap_email($_) } @addresses;

    if ($email_use_mailmap) {
	merge_by_realname(@mapped_emails);
    }

    return @mapped_emails;
}
1211
# Give all emails that share a real name the address of the first email
# seen with that name.
#
# The arguments are rewritten IN PLACE: the loop runs over @_, whose
# elements alias the caller's values.  (Looping over a private copy, with
# nothing returned, would discard every merge.)  Callers must therefore
# pass modifiable values, e.g. an array.
#
# Emails without a name are left alone; otherwise all nameless addresses
# would collapse into the first one.
sub merge_by_realname {
    my %address_map;

    foreach my $email (@_) {
	my ($name, $address) = parse_email($email);
	next if ($name eq "");

	if (exists $address_map{$name}) {
	    $email = format_email($name, $address_map{$name}, 1);
	} else {
	    $address_map{$name} = $address;
	}
    }
}
1226
# Run $cmd through the shell and return its output as a list of lines.
# Leading whitespace of every line is removed first; as the pattern also
# matches newlines, blank lines disappear as well.
sub git_execute_cmd {
    my ($cmd) = @_;

    my $text = `$cmd`;
    $text =~ s/^\s*//gm;

    my @lines = split("\n", $text);
    return @lines;
}
1237
# Run $cmd through the shell and return its output, unmodified, as a list
# of lines.
sub hg_execute_cmd {
    my ($cmd) = @_;

    my $text = `$cmd`;

    my @lines = split("\n", $text);
    return @lines;
}
1247
# Split "Tag: Name <address>" signature lines into tags and signers.
#
# Returns two array references: the tags (the text before the colon) and
# the signers (the text after the colon, passed through
# deduplicate_email() to even out badly written signatures).
sub extract_formatted_signatures {
    my (@signature_lines) = @_;

    my @type = ();
    foreach my $raw (@signature_lines) {
	(my $tag = $raw) =~ s/\s*(.*):.*/$1/;
	push(@type, $tag);
    }

    foreach my $signer (@signature_lines) {
	# cut -f2- -d":"
	$signer =~ s/\s*.*:\s*(.+)\s*/$1/;

	$signer = deduplicate_email($signer);
    }

    return (\@type, \@signature_lines);
}
1266
# Run the VCS command $cmd and extract the signers from its output.
#
# Returns a list whose first element is the number of output lines that
# match the VCS commit pattern and whose remaining elements are the
# formatted signers.  Without any signature line the result is (0).
# In interactive mode the commits are additionally recorded per author
# and per signer.  Signatures matching $penguin_chiefs are dropped unless
# $email_git_penguin_chiefs is set.
sub vcs_find_signers {
    my ($cmd) = @_;

    my @lines = $VCS_cmds{"execute_cmd"}->($cmd);

    my $pattern = $VCS_cmds{"commit_pattern"};
    my $commits = grep { /$pattern/ } @lines;	# of commits

    my @signatures = grep { /^[ \t]*${signature_pattern}.*\@.*$/ } @lines;

    return (0, @signatures) if !@signatures;

    if ($interactive) {
	save_commits_by_author(@lines);
	save_commits_by_signer(@lines);
    }

    @signatures = grep { !/${penguin_chiefs}/i } @signatures
	if (!$email_git_penguin_chiefs);

    my ($types_ref, $signers_ref) = extract_formatted_signatures(@signatures);

    return ($commits, @$signers_ref);
}
1294
# Run the VCS command $cmd and return the authors found in its output,
# each formatted as "Name <address>".
#
# Output lines matching $penguin_chiefs are dropped first unless
# $email_git_penguin_chiefs is set.  In interactive mode the remaining
# lines are also recorded per author and per signer.
sub vcs_find_author {
    my ($cmd) = @_;

    my @lines = $VCS_cmds{"execute_cmd"}->($cmd);

    @lines = grep { !/${penguin_chiefs}/i } @lines
	if (!$email_git_penguin_chiefs);

    return @lines if !@lines;

    my @authors = ();
    foreach my $line (@lines) {
	next if ($line !~ m/$VCS_cmds{"author_pattern"}/);

	my $author = $1;
	my ($name, $address) = parse_email($author);
	$author = format_email($name, $address, 1);
	push(@authors, $author);
    }

    if ($interactive) {
	save_commits_by_author(@lines);
	save_commits_by_signer(@lines);
    }

    return @authors;
}
1322
# Run the blame command $cmd and return the commit id captured from every
# output line that matches the VCS "blame_commit_pattern".
sub vcs_save_commits {
    my ($cmd) = @_;

    my @commits = ();

    foreach my $line ($VCS_cmds{"execute_cmd"}->($cmd)) {
	push(@commits, $1)
	    if ($line =~ m/$VCS_cmds{"blame_commit_pattern"}/);
    }

    return @commits;
}
1338
# Return the commits that blame reports for $file (empty list when $file
# is not a plain file).
#
# Without entries in @range the whole file is blamed.  With entries
# ("file:start:length") only the ranges belonging to $file are used:
# through the VCS range command when there is one, otherwise by picking
# the range out of a blame of the complete file.  A leading "^" is
# stripped from every commit.
#
# The command templates are expanded with s///ee, which resolves
# variables by NAME in this scope; $file, $diff_start and $diff_length
# must therefore keep their names.
sub vcs_blame {
    my ($file) = @_;
    my $cmd;
    my @commits = ();

    return @commits if (!(-f $file));

    if (!@range) {
	$cmd = $VCS_cmds{"blame_file_cmd"};
	$cmd =~ s/(\$\w+)/$1/eeg;		#interpolate $cmd
	@commits = vcs_save_commits($cmd);
    } elsif ($VCS_cmds{"blame_range_cmd"} eq "") {
	my @all_commits = ();

	$cmd = $VCS_cmds{"blame_file_cmd"};
	$cmd =~ s/(\$\w+)/$1/eeg;		#interpolate $cmd
	@all_commits = vcs_save_commits($cmd);

	foreach my $file_range_diff (@range) {
	    (my ($diff_file, $diff_start, $diff_length) =
		$file_range_diff =~ m/(.+):(.+):(.+)/) or next;
	    next if ($file ne $diff_file);
	    # NOTE(review): @all_commits is 0-based; if $diff_start is a
	    # 1-based line number this is off by one - confirm.
	    for (my $idx = $diff_start; $idx < $diff_start + $diff_length; $idx++) {
		push(@commits, $all_commits[$idx]);
	    }
	}
    } else {
	foreach my $file_range_diff (@range) {
	    (my ($diff_file, $diff_start, $diff_length) =
		$file_range_diff =~ m/(.+):(.+):(.+)/) or next;
	    next if ($file ne $diff_file);
	    $cmd = $VCS_cmds{"blame_range_cmd"};
	    $cmd =~ s/(\$\w+)/$1/eeg;		#interpolate $cmd
	    push(@commits, vcs_save_commits($cmd));
	}
    }

    s/^\^//g for (@commits);

    return @commits;
}
1386
# Set once the "no VCS" hint has been printed, so it appears only once.
my $printed_novcs = 0;

# Detect the version control system in use and load its command table
# into %VCS_cmds.
# Returns 1 when the git "available" check succeeds, 2 when the hg one
# does, and 0 (with %VCS_cmds emptied) when neither does.
sub vcs_exists {
    %VCS_cmds = %VCS_cmds_git;
    if (eval $VCS_cmds{"available"}) {
	return 1;
    }

    %VCS_cmds = %VCS_cmds_hg;
    if (eval $VCS_cmds{"available"}) {
	return 2;
    }

    %VCS_cmds = ();
    unless ($printed_novcs) {
	warn($_) foreach (
	    "$P: No supported VCS found.  Add --nogit to options?\n",
	    "Using a git repository produces better results.\n",
	    "Try Linus Torvalds' latest git repository using:\n",
	    "git clone git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git\n",
	);
	$printed_novcs = 1;
    }
    return 0;
}
1403
# True when $vcs_used holds the value vcs_exists() returns for git (1).
# vcs_exists() is called first; its return value is not used here.
sub vcs_is_git {
    vcs_exists();
    return ($vcs_used == 1);
}
1408
# True when $vcs_used holds the value vcs_exists() returns for hg (2).
sub vcs_is_hg {
    return ($vcs_used == 2);
}
1412
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# Interactive selection of the addresses to use.
#
# $list_ref refers to a list of [ email, role ] pairs.  The list is shown
# on STDERR as a numbered menu and commands are read from STDIN (several
# per line, separated by commas or spaces):
#   <n>            toggle entry n
#   * / ^          select all / none            0   invert the selection
#   tm tg tl ts    toggle maintainers / git entries / open lists /
#                  subscriber lists
#   a<n> a* a^     show/hide the authored commits of an entry (or all)
#   s<n> s* s^     show/hide the signed commits of an entry (or all)
#   o              print the option list        h ? print a help text
#   y              approve the selection
# The option commands (g gf b bs c# x# %# d# t m f k r p#) change the
# corresponding setting and restart get_maintainers() with the new
# settings.
#
# Approving clears $interactive, $output_rolestats and $output_roles.
# End of input on STDIN is treated like "y": no further commands can
# arrive, and looping on would never terminate.
#
# Returns the selected entries of the list.
sub interactive_get_maintainers {
    my ($list_ref) = @_;
    my @list = @$list_ref;

    vcs_exists();

    my %selected;
    my %authored;
    my %signed;
    my $count = 0;
    my $maintained = 0;
    foreach my $entry (@list) {
	$maintained = 1 if ($entry->[1] =~ /^(maintainer|supporter)/i);
	$selected{$count} = 1;
	$authored{$count} = 0;
	$signed{$count} = 0;
	$count++;
    }

    #menu loop
    my $done = 0;
    my $print_options = 0;
    my $redraw = 1;
    while (!$done) {
	if ($redraw) {
	    # Recount only while redrawing.  $count must keep the number
	    # of entries when the redraw is skipped, or every numeric
	    # selection entered after an invalid option is rejected.
	    $count = 0;
	    printf STDERR "\n%1s %2s %-65s",
			  "*", "#", "email/list and role:stats";
	    if ($email_git ||
		($email_git_fallback && !$maintained) ||
		$email_git_blame) {
		print STDERR "auth sign";
	    }
	    print STDERR "\n";
	    foreach my $entry (@list) {
		my $email = $entry->[0];
		my $role = $entry->[1];
		my $sel = "";
		$sel = "*" if ($selected{$count});
		my $commit_author = $commit_author_hash{$email};
		my $commit_signer = $commit_signer_hash{$email};
		my $authored = 0;
		my $signed = 0;
		$authored++ for (@{$commit_author});
		$signed++ for (@{$commit_signer});
		printf STDERR "%1s %2d %-65s", $sel, $count + 1, $email;
		printf STDERR "%4d %4d", $authored, $signed
		    if ($authored > 0 || $signed > 0);
		printf STDERR "\n     %s\n", $role;
		if ($authored{$count}) {
		    my $commit_author = $commit_author_hash{$email};
		    foreach my $ref (@{$commit_author}) {
			print STDERR "     Author: @{$ref}[1]\n";
		    }
		}
		if ($signed{$count}) {
		    my $commit_signer = $commit_signer_hash{$email};
		    foreach my $ref (@{$commit_signer}) {
			print STDERR "     @{$ref}[2]: @{$ref}[1]\n";
		    }
		}

		$count++;
	    }
	}
	my $date_ref = \$email_git_since;
	$date_ref = \$email_hg_since if (vcs_is_hg());
	if ($print_options) {
	    $print_options = 0;
	    if (vcs_exists()) {
		print STDERR <<EOT

Version Control options:
g  use git history      [$email_git]
gf use git-fallback     [$email_git_fallback]
b  use git blame        [$email_git_blame]
bs use blame signatures [$email_git_blame_signatures]
c# minimum commits      [$email_git_min_signatures]
%# min percent          [$email_git_min_percent]
d# history to use       [$$date_ref]
x# max maintainers      [$email_git_max_maintainers]
t  all signature types  [$email_git_all_signature_types]
m  use .mailmap         [$email_use_mailmap]
EOT
	    }
	    print STDERR <<EOT

Additional options:
0  toggle all
tm toggle maintainers
tg toggle git entries
tl toggle open list entries
ts toggle subscriber list entries
f  emails in file       [$file_emails]
k  keywords in file     [$keywords]
r  remove duplicates    [$email_remove_duplicates]
p# pattern match depth  [$pattern_depth]
EOT
	}
	print STDERR
"\n#(toggle), A#(author), S#(signed) *(all), ^(none), O(options), Y(approve): ";

	my $input = <STDIN>;
	# End of input: approve the current selection instead of
	# prompting forever.
	$input = "y" if (!defined($input));
	chomp($input);

	$redraw = 1;
	my $rerun = 0;
	my @wish = split(/[, ]+/, $input);
	foreach my $nr (@wish) {
	    $nr = lc($nr);
	    my $sel = substr($nr, 0, 1);
	    my $str = substr($nr, 1);
	    my $val = 0;
	    $val = $1 if $str =~ /^(\d+)$/;

	    if ($sel eq "y") {
		$interactive = 0;
		$done = 1;
		$output_rolestats = 0;
		$output_roles = 0;
		last;
	    } elsif ($nr =~ /^\d+$/ && $nr > 0 && $nr <= $count) {
		$selected{$nr - 1} = !$selected{$nr - 1};
	    } elsif ($sel eq "*" || $sel eq '^') {
		my $toggle = 0;
		$toggle = 1 if ($sel eq '*');
		for (my $i = 0; $i < $count; $i++) {
		    $selected{$i} = $toggle;
		}
	    } elsif ($sel eq "0") {
		for (my $i = 0; $i < $count; $i++) {
		    $selected{$i} = !$selected{$i};
		}
	    } elsif ($sel eq "t") {
		if (lc($str) eq "m") {
		    for (my $i = 0; $i < $count; $i++) {
			$selected{$i} = !$selected{$i}
			    if ($list[$i]->[1] =~ /^(maintainer|supporter)/i);
		    }
		} elsif (lc($str) eq "g") {
		    for (my $i = 0; $i < $count; $i++) {
			$selected{$i} = !$selected{$i}
			    if ($list[$i]->[1] =~ /^(author|commit|signer)/i);
		    }
		} elsif (lc($str) eq "l") {
		    for (my $i = 0; $i < $count; $i++) {
			$selected{$i} = !$selected{$i}
			    if ($list[$i]->[1] =~ /^(open list)/i);
		    }
		} elsif (lc($str) eq "s") {
		    for (my $i = 0; $i < $count; $i++) {
			$selected{$i} = !$selected{$i}
			    if ($list[$i]->[1] =~ /^(subscriber list)/i);
		    }
		} elsif ($str eq "") {
		    # A bare "t" is the "all signature types" option.  It
		    # has to be handled here: a separate "t" branch further
		    # down the chain can never be reached.
		    bool_invert(\$email_git_all_signature_types);
		    $rerun = 1;
		}
	    } elsif ($sel eq "a") {
		if ($val > 0 && $val <= $count) {
		    $authored{$val - 1} = !$authored{$val - 1};
		} elsif ($str eq '*' || $str eq '^') {
		    my $toggle = 0;
		    $toggle = 1 if ($str eq '*');
		    for (my $i = 0; $i < $count; $i++) {
			$authored{$i} = $toggle;
		    }
		}
	    } elsif ($sel eq "s") {
		if ($val > 0 && $val <= $count) {
		    $signed{$val - 1} = !$signed{$val - 1};
		} elsif ($str eq '*' || $str eq '^') {
		    my $toggle = 0;
		    $toggle = 1 if ($str eq '*');
		    for (my $i = 0; $i < $count; $i++) {
			$signed{$i} = $toggle;
		    }
		}
	    } elsif ($sel eq "o") {
		$print_options = 1;
		$redraw = 1;
	    } elsif ($sel eq "g") {
		if ($str eq "f") {
		    bool_invert(\$email_git_fallback);
		} else {
		    bool_invert(\$email_git);
		}
		$rerun = 1;
	    } elsif ($sel eq "b") {
		if ($str eq "s") {
		    bool_invert(\$email_git_blame_signatures);
		} else {
		    bool_invert(\$email_git_blame);
		}
		$rerun = 1;
	    } elsif ($sel eq "c") {
		if ($val > 0) {
		    $email_git_min_signatures = $val;
		    $rerun = 1;
		}
	    } elsif ($sel eq "x") {
		if ($val > 0) {
		    $email_git_max_maintainers = $val;
		    $rerun = 1;
		}
	    } elsif ($sel eq "%") {
		if ($str ne "" && $val >= 0) {
		    $email_git_min_percent = $val;
		    $rerun = 1;
		}
	    } elsif ($sel eq "d") {
		if (vcs_is_git()) {
		    $email_git_since = $str;
		} elsif (vcs_is_hg()) {
		    $email_hg_since = $str;
		}
		$rerun = 1;
	    } elsif ($sel eq "f") {
		bool_invert(\$file_emails);
		$rerun = 1;
	    } elsif ($sel eq "r") {
		bool_invert(\$email_remove_duplicates);
		$rerun = 1;
	    } elsif ($sel eq "m") {
		bool_invert(\$email_use_mailmap);
		read_mailmap();
		$rerun = 1;
	    } elsif ($sel eq "k") {
		bool_invert(\$keywords);
		$rerun = 1;
	    } elsif ($sel eq "p") {
		if ($str ne "" && $val >= 0) {
		    $pattern_depth = $val;
		    $rerun = 1;
		}
	    } elsif ($sel eq "h" || $sel eq "?") {
		print STDERR <<EOT

Interactive mode allows you to select the various maintainers, submitters,
commit signers and mailing lists that could be CC'd on a patch.

Any *'d entry is selected.

If you have git or hg installed, you can choose to summarize the commit
history of files in the patch.  Also, each line of the current file can
be matched to its commit author and that commits signers with blame.

Various knobs exist to control the length of time for active commit
tracking, the maximum number of commit authors and signers to add,
and such.

Enter selections at the prompt until you are satisfied that the selected
maintainers are appropriate.  You may enter multiple selections separated
by either commas or spaces.

EOT
	    } else {
		print STDERR "invalid option: '$nr'\n";
		$redraw = 0;
	    }
	}
	if ($rerun) {
	    print STDERR "git-blame can be very slow, please have patience..."
		if ($email_git_blame);
	    # tail call: start over with the changed settings
	    goto &get_maintainers;
	}
    }

    #drop not selected entries
    $count = 0;
    my @new_emailto = ();
    foreach my $entry (@list) {
	if ($selected{$count}) {
	    push(@new_emailto, $list[$count]);
	}
	$count++;
    }
    return @new_emailto;
}
1692
# Invert the flag behind the scalar reference $bool_ref: a true value
# becomes 0, a false value becomes 1.
sub bool_invert {
    my ($bool_ref) = @_;

    $$bool_ref = $$bool_ref ? 0 : 1;
}
1702
# Normalize $email and, with $email_remove_duplicates set, replace it by
# the first identity seen with the same name or the same address.
#
# The email is reformatted as "Name <address>" and passed through
# mailmap_email().  Identities are remembered in %deduplicate_name_hash
# and %deduplicate_address_hash under their lower-cased name/address; a
# name match takes precedence over an address match.
sub deduplicate_email {
    my ($email) = @_;

    my ($name, $address) = parse_email($email);
    $email = format_email($name, $address, 1);
    $email = mailmap_email($email);

    return $email if (!$email_remove_duplicates);

    ($name, $address) = parse_email($email);

    my $known;
    if ($name ne "" && $deduplicate_name_hash{lc($name)}) {
	$known = $deduplicate_name_hash{lc($name)};
    } elsif ($deduplicate_address_hash{lc($address)}) {
	$known = $deduplicate_address_hash{lc($address)};
    }

    if ($known) {
	($name, $address) = ($known->[0], $known->[1]);
    } else {
	# first sighting: remember this identity under both keys
	$deduplicate_name_hash{lc($name)} = [ $name, $address ];
	$deduplicate_address_hash{lc($address)} = [ $name, $address ];
    }

    $email = format_email($name, $address, 1);
    $email = mailmap_email($email);
    return $email;
}
1732
# Record the commits found in VCS log output per author in
# %commit_author_hash.
#
# Authors, commit ids and subjects are gathered into three lists with the
# corresponding VCS patterns; the n-th author is combined with the n-th
# commit and the n-th subject.  A [ commit, subject ] pair is stored only
# once per author.
sub save_commits_by_author {
    my (@lines) = @_;

    my (@authors, @commits, @subjects);

    foreach my $line (@lines) {
	if ($line =~ m/$VCS_cmds{"author_pattern"}/) {
	    my $author = $1;
	    push(@authors, deduplicate_email($author));
	}
	push(@commits, $1) if ($line =~ m/$VCS_cmds{"commit_pattern"}/);
	push(@subjects, $1) if ($line =~ m/$VCS_cmds{"subject_pattern"}/);
    }

    foreach my $i (0 .. $#authors) {
	my $author = $authors[$i];
	my $known = 0;

	foreach my $ref (@{$commit_author_hash{$author}}) {
	    next if ($ref->[0] ne $commits[$i]);
	    next if ($ref->[1] ne $subjects[$i]);
	    $known = 1;
	    last;
	}

	push(@{$commit_author_hash{$author}}, [ $commits[$i], $subjects[$i] ])
	    if (!$known);
    }
}
1765
# Record the commits found in VCS log output per signer in
# %commit_signer_hash.
#
# The lines are scanned in order.  The most recent commit id and subject
# are remembered and combined with each following signature line into a
# [ commit, subject, signature type ] triple, stored once per signer.
sub save_commits_by_signer {
    my (@lines) = @_;

    my $commit = "";
    my $subject = "";

    foreach my $line (@lines) {
	$commit = $1 if ($line =~ m/$VCS_cmds{"commit_pattern"}/);
	$subject = $1 if ($line =~ m/$VCS_cmds{"subject_pattern"}/);

	next if ($line !~ /^[ \t]*${signature_pattern}.*\@.*$/);

	my ($types_ref, $signers_ref) = extract_formatted_signatures($line);
	my $type = $types_ref->[0];
	my $signer = deduplicate_email($signers_ref->[0]);

	my $known = 0;
	foreach my $ref (@{$commit_signer_hash{$signer}}) {
	    next if ($ref->[0] ne $commit);
	    next if ($ref->[1] ne $subject);
	    next if ($ref->[2] ne $type);
	    $known = 1;
	    last;
	}

	push(@{$commit_signer_hash{$signer}}, [ $commit, $subject, $type ])
	    if (!$known);
    }
}
1802
# Add the most frequent people of @lines to the recipients, with $role.
#
# @lines holds one email per occurrence (e.g. one per sign-off); $divisor
# is the total the occurrences are related to.  A non-positive divisor is
# reported and replaced by 1.  After mailmap processing the emails are
# counted and visited by descending count.  The walk stops at the first
# email that has fewer than $email_git_min_signatures occurrences, falls
# below $email_git_min_percent, or exceeds $email_git_max_maintainers
# entries.  With $output_rolestats the role is extended by
# ":<count>/<divisor>=<percent>%".
sub vcs_assign {
    my ($role, $divisor, @lines) = @_;

    my %hash;
    my $count = 0;

    return if (@lines <= 0);

    if ($divisor <= 0) {
	warn("Bad divisor in " . (caller(0))[3] . ": $divisor\n");
	$divisor = 1;
    }

    @lines = mailmap(@lines);

    return if (@lines <= 0);

    # uniq -c
    $hash{$_}++ for @lines;

    # sort -rn.  Equal counts are ordered by email: hash key order is
    # randomized, so without the tie-break both the output order and the
    # entries surviving the max_maintainers cut could differ per run.
    foreach my $line (sort { $hash{$b} <=> $hash{$a} || $a cmp $b }
		      keys %hash) {
	my $sign_offs = $hash{$line};
	my $percent = $sign_offs * 100 / $divisor;

	$percent = 100 if ($percent > 100);
	$count++;
	last if ($sign_offs < $email_git_min_signatures ||
		 $count > $email_git_max_maintainers ||
		 $percent < $email_git_min_percent);
	push_email_address($line, '');
	if ($output_rolestats) {
	    my $fmt_percent = sprintf("%.0f", $percent);
	    add_role($line, "$role:$sign_offs/$divisor=$fmt_percent%");
	} else {
	    add_role($line, $role);
	}
    }
}
1844
# Add the people who signed commits touching $file, with the role
# "commit_signer".  Nothing is done when no VCS is available; the
# detected VCS is stored in $vcs_used.
#
# The command template is expanded with s///ee, which resolves variables
# by NAME in this scope; $file must therefore keep its name.
sub vcs_file_signoffs {
    my ($file) = @_;

    my @signers = ();
    my $commits;

    $vcs_used = vcs_exists();
    if (!$vcs_used) {
	return;
    }

    my $cmd = $VCS_cmds{"find_signers_cmd"};
    $cmd =~ s/(\$\w+)/$1/eeg;		# interpolate $cmd

    ($commits, @signers) = vcs_find_signers($cmd);

    for my $signer (@signers) {
	$signer = deduplicate_email($signer);
    }

    vcs_assign("commit_signer", $commits, @signers);
}
1865
# Add the people found through blame of $file.  Nothing is done when no
# VCS is available; the detected VCS is stored in $vcs_used.
#
# With $email_git_blame_signatures the signers of the blamed commits are
# collected (hg: one command for all commits, otherwise one command per
# commit).  They are assigned with the role "commits" in file mode
# ($from_filename) and "modified commits" otherwise.  In file mode with
# $output_rolestats the commit authors are looked up as well, weighted by
# the number of lines blamed on each commit ("authored lines").
#
# The command templates are expanded with s///ee, which resolves
# variables by NAME in this scope; $file and $commit must therefore keep
# their names.
sub vcs_file_blame {
    my ($file) = @_;

    my @signers = ();
    my @all_commits = ();
    my @commits = ();
    my $total_commits;
    my $total_lines;

    $vcs_used = vcs_exists();
    return if (!$vcs_used);

    @all_commits = vcs_blame($file);
    @commits = uniq(@all_commits);
    $total_commits = @commits;
    $total_lines = @all_commits;

    if ($email_git_blame_signatures) {
	# hg: a single query with all commits joined by " -r ";
	# otherwise one query per commit.
	my @queries = vcs_is_hg() ? (join(" -r ", @commits)) : @commits;

	foreach my $commit (@queries) {
	    my $commit_count;
	    my @commit_signers = ();
	    my $cmd;

	    $cmd = $VCS_cmds{"find_commit_signers_cmd"};
	    $cmd =~ s/(\$\w+)/$1/eeg;	#substitute variables in $cmd

	    ($commit_count, @commit_signers) = vcs_find_signers($cmd);

	    push(@signers, @commit_signers);
	}
    }

    if ($from_filename && $output_rolestats) {
	my @blame_signers;
	if (vcs_is_hg()) {
	    @commits = uniq(@commits);
	    @commits = sort(@commits);
	    my $commit = join(" -r ", @commits);
	    my $cmd;

	    $cmd = $VCS_cmds{"find_commit_author_cmd"};
	    $cmd =~ s/(\$\w+)/$1/eeg;	#substitute variables in $cmd

	    my @lines = ();

	    @lines = $VCS_cmds{"execute_cmd"}->($cmd);

	    if (!$email_git_penguin_chiefs) {
		@lines = grep(!/${penguin_chiefs}/i, @lines);
	    }

	    if (@lines) {
		my @authors = ();
		foreach my $line (@lines) {
		    if ($line =~ m/$VCS_cmds{"author_pattern"}/) {
			my $author = $1;
			$author = deduplicate_email($author);
			push(@authors, $author);
		    }
		}

		save_commits_by_author(@lines) if ($interactive);
		save_commits_by_signer(@lines) if ($interactive);

		# NOTE(review): the authors go to @signers here, not to
		# @blame_signers as in the per-commit path - confirm
		# that this is intended.
		push(@signers, @authors);
	    }
	} else {
	    foreach my $commit (@commits) {
		my $cmd = $VCS_cmds{"find_commit_author_cmd"};
		$cmd =~ s/(\$\w+)/$1/eeg;	#interpolate $cmd
		my @author = vcs_find_author($cmd);
		next if !@author;

		my $formatted_author = deduplicate_email($author[0]);

		# one entry per blamed line of this commit
		my $count = grep(/$commit/, @all_commits);
		push(@blame_signers, ($formatted_author) x $count);
	    }
	}
	if (@blame_signers) {
	    vcs_assign("authored lines", $total_lines, @blame_signers);
	}
    }

    foreach my $signer (@signers) {
	$signer = deduplicate_email($signer);
    }
    vcs_assign($from_filename ? "commits" : "modified commits",
	       $total_commits, @signers);
}
1981
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# Return the arguments without duplicates, keeping the first occurrence
# of each value and the original order.
sub uniq {
    my (@parms) = @_;

    my %seen;
    my @distinct = ();
    foreach my $item (@parms) {
	next if ($seen{$item}++);
	push(@distinct, $item);
    }
    return @distinct;
}
1989
# Return the arguments sorted as strings, without duplicates.
sub sort_and_uniq {
    my (@parms) = @_;

    my %seen;
    my @distinct = ();
    foreach my $item (sort @parms) {
	next if ($seen{$item}++);
	push(@distinct, $item);
    }
    return @distinct;
}
1998
# Tidy up email addresses picked from the text of a file and return them
# formatted with format_email().
#
# For each entry the address is wrapped in <>, then the name is reduced:
# of names with more than two words only the last two are kept, or the
# last three when the third-last or second-last word looks like an
# initial.  One leading and one trailing "," or "." is removed from the
# name (also directly inside a surrounding double quote).
sub clean_file_emails {
    my (@file_emails) = @_;
    my @fmt_emails = ();

    foreach my $email (@file_emails) {
	$email =~ s/[\(\<\{]{0,1}([A-Za-z0-9_\.\+-]+\@[A-Za-z0-9\.-]+)[\)\>\}]{0,1}/\<$1\>/g;
	my ($name, $address) = parse_email($email);
	$name = "" if ($name eq '"[,\.]"');

	my @nw = split(/[^A-Za-zÀ-ÿ\'\,\.\+-]/, $name);
	if (@nw > 2) {
	    my ($first, $middle, $last) = @nw[-3 .. -1];

	    my $first_is_initial =
		(length($first) == 1 && $first =~ m/[A-Za-z]/) ||
		(length($first) == 2 && substr($first, -1) eq ".");
	    my $middle_is_initial =
		length($middle) == 1 ||
		(length($middle) == 2 && substr($middle, -1) eq ".");

	    $name = ($first_is_initial || $middle_is_initial)
		? "$first $middle $last"
		: "$middle $last";
	}

	# trailing "," or "."
	if (substr($name, -1) =~ /[,\.]/) {
	    $name = substr($name, 0, -1);
	} elsif (substr($name, -2) =~ /[,\.]"/) {
	    $name = substr($name, 0, -2) . '"';
	}

	# leading "," or "."
	if (substr($name, 0, 1) =~ /[,\.]/) {
	    $name = substr($name, 1);
	} elsif (substr($name, 0, 2) =~ /"[,\.]/) {
	    $name = '"' . substr($name, 2);
	}

	push(@fmt_emails, format_email($name, $address, $email_usename));
    }
    return @fmt_emails;
}
2043
# Turn [ address, role ] pairs into output lines, one per distinct
# address (first occurrence wins).  With $output_roles the line reads
# "address (role)", otherwise just the address.
sub merge_email {
    my @lines;
    my %saw;

    foreach my $pair (@_) {
	my ($address, $role) = @$pair;
	next if ($saw{$address});

	push(@lines, $output_roles ? "$address ($role)" : $address);
	$saw{$address} = 1;
    }

    return @lines;
}
2062
# Print the given values to standard output: joined with
# $output_separator on a single line, or one value per line when
# $output_multiline is set.
sub output {
    my (@parms) = @_;

    if (!$output_multiline) {
	print(join($output_separator, @parms));
	print("\n");
    } else {
	print("${_}\n") foreach (@parms);
    }
}
2075
# Cache for the pattern built by make_rfc822re().
my $rfc822re;

# Build and return the source text of a regular expression that matches
# one RFC822 address (a mailbox or a group), with optional leading
# whitespace.
#
# The grammar is assembled bottom-up from the lexical tokens: specials,
# domain literal, quoted string and atom.  Each token may be followed by
# $rfc822_lwsp.  Comments are not handled; the pattern is meant for
# input whose comments have already been replaced by whitespace.
sub make_rfc822re {
    my $specials = '()<>@,;:\\\\".\\[\\]';
    my $controls = '\\000-\\037\\177';

    my $dtext = "[^\\[\\]\\r\\\\]";
    my $domain_literal = "\\[(?:$dtext|\\\\.)*\\]$rfc822_lwsp*";

    my $quoted_string = "\"(?:[^\\\"\\r\\\\]|\\\\.|$rfc822_lwsp)*\"$rfc822_lwsp*";

    # The end of an atom is found with a zero-width assertion; a plain
    # $rfc822_lwsp* occasionally makes the regexp engine hang.
    my $atom = "[^$specials $controls]+(?:$rfc822_lwsp+|\\Z|(?=[\\[\"$specials]))";
    my $word = "(?:$atom|$quoted_string)";
    my $localpart = "$word(?:\\.$rfc822_lwsp*$word)*";

    my $sub_domain = "(?:$atom|$domain_literal)";
    my $domain = "$sub_domain(?:\\.$rfc822_lwsp*$sub_domain)*";

    my $addr_spec = "$localpart\@$rfc822_lwsp*$domain";

    my $phrase = "$word*";
    my $route = "(?:\@$domain(?:,\@$rfc822_lwsp*$domain)*:$rfc822_lwsp*)";
    my $route_addr = "\\<$rfc822_lwsp*$route?$addr_spec\\>$rfc822_lwsp*";
    my $mailbox = "(?:$addr_spec|$phrase$route_addr)";

    my $group = "$phrase:$rfc822_lwsp*(?:$mailbox(?:,\\s*$mailbox)*)?;\\s*";
    my $address = "(?:$mailbox|$group)";

    return "$rfc822_lwsp*$address";
}
2113
# Return the argument with every RFC822 comment "( ... )" replaced by a
# single space.
#
# One innermost comment is removed per pass, so nested comments vanish
# from the inside out.  Parentheses inside double-quoted strings are left
# alone, and backslash-escaped characters are skipped as a unit.
sub rfc822_strip_comments {
    my $s = shift;

    1 while ($s =~ s/^((?:[^"\\]|\\.)*
                    (?:"(?:[^"\\]|\\.)*"(?:[^"\\]|\\.)*)*)
                    \((?:[^()\\]|\\.)*\)/$1 /osx);

    return $s;
}
2125
#   valid: returns true if the parameter, after removal of its comments,
#          is a single RFC822 valid address made of $rfc822_char
#          characters only.  The address pattern is built on first use
#          and cached in $rfc822re.
#
sub rfc822_valid {
    my $s = rfc822_strip_comments(shift);

    $rfc822re ||= make_rfc822re();

    return $s =~ m/^$rfc822re$/so && $s =~ m/^$rfc822_char*$/;
}
2137
2138#   validlist: In scalar context, returns true if the parameter is an RFC822
2139#              valid list of addresses.
2140#
2141#              In list context, returns an empty list on failure (an invalid
2142#              address was found); otherwise a list whose first element is the
2143#              number of addresses found and whose remaining elements are the
2144#              addresses.  This is needed to disambiguate failure (invalid)
2145#              from success with no addresses found, because an empty string is
2146#              a valid list.
2147
sub rfc822_validlist {
    my $s = rfc822_strip_comments(shift);

    # Build and cache the address regexp on first use.
    $rfc822re = make_rfc822re() unless ($rfc822re);

    # The whole string must be a comma separated list of addresses, where
    # any item may be empty (null list items are valid according to the RFC).
    my $is_list = $s =~ m/^(?:$rfc822re)?(?:,(?:$rfc822re)?)*$/so &&
	$s =~ m/^$rfc822_char*$/;

    # Failure: empty list in list context, 0 in scalar context.
    return wantarray ? () : 0 if (!$is_list);

    # Collect every address.  In list context the count is returned first
    # so that "valid but empty" can be told apart from failure.
    my @found;
    while ($s =~ m/(?:^|,$rfc822_lwsp*)($rfc822re)/gos) {
        push(@found, $1);
    }
    return wantarray ? (scalar(@found), @found) : 1;
}
v6.8
   1#!/usr/bin/env perl
   2# SPDX-License-Identifier: GPL-2.0
   3#
   4# (c) 2007, Joe Perches <joe@perches.com>
   5#           created from checkpatch.pl
   6#
   7# Print selected MAINTAINERS information for
   8# the files modified in a patch or for a file
   9#
  10# usage: perl scripts/get_maintainer.pl [OPTIONS] <patch>
  11#        perl scripts/get_maintainer.pl [OPTIONS] -f <file>
 
 
  12
  13use warnings;
  14use strict;
  15
  16my $P = $0;
  17my $V = '0.26';
  18
  19use Getopt::Long qw(:config no_auto_abbrev);
  20use Cwd;
  21use File::Find;
  22use File::Spec::Functions;
  23use open qw(:std :encoding(UTF-8));
  24
  25my $cur_path = fastgetcwd() . '/';
  26my $lk_path = "./";
  27my $email = 1;
  28my $email_usename = 1;
  29my $email_maintainer = 1;
  30my $email_reviewer = 1;
  31my $email_fixes = 1;
  32my $email_list = 1;
  33my $email_moderated_list = 1;
  34my $email_subscriber_list = 0;
  35my $email_git_penguin_chiefs = 0;
  36my $email_git = 0;
  37my $email_git_all_signature_types = 0;
  38my $email_git_blame = 0;
  39my $email_git_blame_signatures = 1;
  40my $email_git_fallback = 1;
  41my $email_git_min_signatures = 1;
  42my $email_git_max_maintainers = 5;
  43my $email_git_min_percent = 5;
  44my $email_git_since = "1-year-ago";
  45my $email_hg_since = "-365";
  46my $interactive = 0;
  47my $email_remove_duplicates = 1;
  48my $email_use_mailmap = 1;
  49my $output_multiline = 1;
  50my $output_separator = ", ";
  51my $output_roles = 0;
  52my $output_rolestats = 1;
  53my $output_section_maxlen = 50;
  54my $scm = 0;
  55my $tree = 1;
  56my $web = 0;
  57my $subsystem = 0;
  58my $status = 0;
  59my $letters = "";
  60my $keywords = 1;
  61my $keywords_in_file = 0;
  62my $sections = 0;
  63my $email_file_emails = 0;
  64my $from_filename = 0;
  65my $pattern_depth = 0;
  66my $self_test = undef;
  67my $version = 0;
  68my $help = 0;
  69my $find_maintainer_files = 0;
  70my $maintainer_path;
  71my $vcs_used = 0;
  72
  73my $exit = 0;
  74
  75my @files = ();
  76my @fixes = ();			# If a patch description includes Fixes: lines
  77my @range = ();
  78my @keyword_tvi = ();
  79my @file_emails = ();
  80
  81my %commit_author_hash;
  82my %commit_signer_hash;
  83
  84my @penguin_chief = ();
  85push(@penguin_chief, "Linus Torvalds:torvalds\@linux-foundation.org");
  86#Andrew wants in on most everything - 2009/01/14
  87#push(@penguin_chief, "Andrew Morton:akpm\@linux-foundation.org");
  88
  89my @penguin_chief_names = ();
  90foreach my $chief (@penguin_chief) {
  91    if ($chief =~ m/^(.*):(.*)/) {
  92	my $chief_name = $1;
  93	my $chief_addr = $2;
  94	push(@penguin_chief_names, $chief_name);
  95    }
  96}
  97my $penguin_chiefs = "\(" . join("|", @penguin_chief_names) . "\)";
  98
  99# Signature types of people who are either
 100# 	a) responsible for the code in question, or
 101# 	b) familiar enough with it to give relevant feedback
 102my @signature_tags = ();
 103push(@signature_tags, "Signed-off-by:");
 104push(@signature_tags, "Reviewed-by:");
 105push(@signature_tags, "Acked-by:");
 106
 107my $signature_pattern = "\(" . join("|", @signature_tags) . "\)";
 108
 109# rfc822 email address - preloaded methods go here.
 110my $rfc822_lwsp = "(?:(?:\\r\\n)?[ \\t])";
 111my $rfc822_char = '[\\000-\\377]';
 112
 113# VCS command support: class-like functions and strings
 114
 115my %VCS_cmds;
 116
 117my %VCS_cmds_git = (
 118    "execute_cmd" => \&git_execute_cmd,
 119    "available" => '(which("git") ne "") && (-e ".git")',
 120    "find_signers_cmd" =>
 121	"git log --no-color --follow --since=\$email_git_since " .
 122	    '--numstat --no-merges ' .
 123	    '--format="GitCommit: %H%n' .
 124		      'GitAuthor: %an <%ae>%n' .
 125		      'GitDate: %aD%n' .
 126		      'GitSubject: %s%n' .
 127		      '%b%n"' .
 128	    " -- \$file",
 129    "find_commit_signers_cmd" =>
 130	"git log --no-color " .
 131	    '--numstat ' .
 132	    '--format="GitCommit: %H%n' .
 133		      'GitAuthor: %an <%ae>%n' .
 134		      'GitDate: %aD%n' .
 135		      'GitSubject: %s%n' .
 136		      '%b%n"' .
 137	    " -1 \$commit",
 138    "find_commit_author_cmd" =>
 139	"git log --no-color " .
 140	    '--numstat ' .
 141	    '--format="GitCommit: %H%n' .
 142		      'GitAuthor: %an <%ae>%n' .
 143		      'GitDate: %aD%n' .
 144		      'GitSubject: %s%n"' .
 145	    " -1 \$commit",
 146    "blame_range_cmd" => "git blame -l -L \$diff_start,+\$diff_length \$file",
 147    "blame_file_cmd" => "git blame -l \$file",
 148    "commit_pattern" => "^GitCommit: ([0-9a-f]{40,40})",
 149    "blame_commit_pattern" => "^([0-9a-f]+) ",
 150    "author_pattern" => "^GitAuthor: (.*)",
 151    "subject_pattern" => "^GitSubject: (.*)",
 152    "stat_pattern" => "^(\\d+)\\t(\\d+)\\t\$file\$",
 153    "file_exists_cmd" => "git ls-files \$file",
 154    "list_files_cmd" => "git ls-files \$file",
 155);
 156
 157my %VCS_cmds_hg = (
 158    "execute_cmd" => \&hg_execute_cmd,
 159    "available" => '(which("hg") ne "") && (-d ".hg")',
 160    "find_signers_cmd" =>
 161	"hg log --date=\$email_hg_since " .
 162	    "--template='HgCommit: {node}\\n" .
 163	                "HgAuthor: {author}\\n" .
 164			"HgSubject: {desc}\\n'" .
 165	    " -- \$file",
 166    "find_commit_signers_cmd" =>
 167	"hg log " .
 168	    "--template='HgSubject: {desc}\\n'" .
 169	    " -r \$commit",
 170    "find_commit_author_cmd" =>
 171	"hg log " .
 172	    "--template='HgCommit: {node}\\n" .
 173		        "HgAuthor: {author}\\n" .
 174			"HgSubject: {desc|firstline}\\n'" .
 175	    " -r \$commit",
 176    "blame_range_cmd" => "",		# not supported
 177    "blame_file_cmd" => "hg blame -n \$file",
 178    "commit_pattern" => "^HgCommit: ([0-9a-f]{40,40})",
 179    "blame_commit_pattern" => "^([ 0-9a-f]+):",
 180    "author_pattern" => "^HgAuthor: (.*)",
 181    "subject_pattern" => "^HgSubject: (.*)",
 182    "stat_pattern" => "^(\\d+)\t(\\d+)\t\$file\$",
 183    "file_exists_cmd" => "hg files \$file",
 184    "list_files_cmd" => "hg manifest -R \$file",
 185);
 186
 187my $conf = which_conf(".get_maintainer.conf");
 188if (-f $conf) {
 189    my @conf_args;
 190    open(my $conffile, '<', "$conf")
 191	or warn "$P: Can't find a readable .get_maintainer.conf file $!\n";
 192
 193    while (<$conffile>) {
 194	my $line = $_;
 195
 196	$line =~ s/\s*\n?$//g;
 197	$line =~ s/^\s*//g;
 198	$line =~ s/\s+/ /g;
 199
 200	next if ($line =~ m/^\s*#/);
 201	next if ($line =~ m/^\s*$/);
 202
 203	my @words = split(" ", $line);
 204	foreach my $word (@words) {
 205	    last if ($word =~ m/^#/);
 206	    push (@conf_args, $word);
 207	}
 208    }
 209    close($conffile);
 210    unshift(@ARGV, @conf_args) if @conf_args;
 211}
 212
 213my @ignore_emails = ();
 214my $ignore_file = which_conf(".get_maintainer.ignore");
 215if (-f $ignore_file) {
 216    open(my $ignore, '<', "$ignore_file")
 217	or warn "$P: Can't find a readable .get_maintainer.ignore file $!\n";
 218    while (<$ignore>) {
 219	my $line = $_;
 220
 221	$line =~ s/\s*\n?$//;
 222	$line =~ s/^\s*//;
 223	$line =~ s/\s+$//;
 224	$line =~ s/#.*$//;
 225
 226	next if ($line =~ m/^\s*$/);
 227	if (rfc822_valid($line)) {
 228	    push(@ignore_emails, $line);
 229	}
 230    }
 231    close($ignore);
 232}
 233
 234if ($#ARGV > 0) {
 235    foreach (@ARGV) {
 236        if ($_ =~ /^-{1,2}self-test(?:=|$)/) {
 237            die "$P: using --self-test does not allow any other option or argument\n";
 238        }
 239    }
 240}
 241
 242if (!GetOptions(
 243		'email!' => \$email,
 244		'git!' => \$email_git,
 245		'git-all-signature-types!' => \$email_git_all_signature_types,
 246		'git-blame!' => \$email_git_blame,
 247		'git-blame-signatures!' => \$email_git_blame_signatures,
 248		'git-fallback!' => \$email_git_fallback,
 249		'git-chief-penguins!' => \$email_git_penguin_chiefs,
 250		'git-min-signatures=i' => \$email_git_min_signatures,
 251		'git-max-maintainers=i' => \$email_git_max_maintainers,
 252		'git-min-percent=i' => \$email_git_min_percent,
 253		'git-since=s' => \$email_git_since,
 254		'hg-since=s' => \$email_hg_since,
 255		'i|interactive!' => \$interactive,
 256		'remove-duplicates!' => \$email_remove_duplicates,
 257		'mailmap!' => \$email_use_mailmap,
 258		'm!' => \$email_maintainer,
 259		'r!' => \$email_reviewer,
 260		'n!' => \$email_usename,
 261		'l!' => \$email_list,
 262		'fixes!' => \$email_fixes,
 263		'moderated!' => \$email_moderated_list,
 264		's!' => \$email_subscriber_list,
 265		'multiline!' => \$output_multiline,
 266		'roles!' => \$output_roles,
 267		'rolestats!' => \$output_rolestats,
 268		'separator=s' => \$output_separator,
 269		'subsystem!' => \$subsystem,
 270		'status!' => \$status,
 271		'scm!' => \$scm,
 272		'tree!' => \$tree,
 273		'web!' => \$web,
 274		'letters=s' => \$letters,
 275		'pattern-depth=i' => \$pattern_depth,
 276		'k|keywords!' => \$keywords,
 277		'kf|keywords-in-file!' => \$keywords_in_file,
 278		'sections!' => \$sections,
 279		'fe|file-emails!' => \$email_file_emails,
 280		'f|file' => \$from_filename,
 281		'find-maintainer-files' => \$find_maintainer_files,
 282		'mpath|maintainer-path=s' => \$maintainer_path,
 283		'self-test:s' => \$self_test,
 284		'v|version' => \$version,
 285		'h|help|usage' => \$help,
 286		)) {
 287    die "$P: invalid argument - use --help if necessary\n";
 288}
 289
 290if ($help != 0) {
 291    usage();
 292    exit 0;
 293}
 294
 295if ($version != 0) {
 296    print("${P} ${V}\n");
 297    exit 0;
 298}
 299
 300if (defined $self_test) {
 301    read_all_maintainer_files();
 302    self_test();
 303    exit 0;
 304}
 305
 306if (-t STDIN && !@ARGV) {
 307    # We're talking to a terminal, but have no command line arguments.
 308    die "$P: missing patchfile or -f file - use --help if necessary\n";
 309}
 310
 311$output_multiline = 0 if ($output_separator ne ", ");
 312$output_rolestats = 1 if ($interactive);
 313$output_roles = 1 if ($output_rolestats);
 314
 315if ($sections || $letters ne "") {
 316    $sections = 1;
 317    $email = 0;
 318    $email_list = 0;
 319    $scm = 0;
 320    $status = 0;
 321    $subsystem = 0;
 322    $web = 0;
 323    $keywords = 0;
 324    $keywords_in_file = 0;
 325    $interactive = 0;
 326} else {
 327    my $selections = $email + $scm + $status + $subsystem + $web;
 328    if ($selections == 0) {
 329	die "$P:  Missing required option: email, scm, status, subsystem or web\n";
 330    }
 331}
 332
 333if ($email &&
 334    ($email_maintainer + $email_reviewer +
 335     $email_list + $email_subscriber_list +
 336     $email_git + $email_git_penguin_chiefs + $email_git_blame) == 0) {
 337    die "$P: Please select at least 1 email option\n";
 338}
 339
 340if ($tree && !top_of_kernel_tree($lk_path)) {
 341    die "$P: The current directory does not appear to be "
 342	. "a linux kernel source tree.\n";
 343}
 344
 345## Read MAINTAINERS for type/value pairs
 346
 347my @typevalue = ();
 348my %keyword_hash;
 349my @mfiles = ();
 350my @self_test_info = ();
 351
 352sub read_maintainer_file {
 353    my ($file) = @_;
 
 
 354
 355    open (my $maint, '<', "$file")
 356	or die "$P: Can't open MAINTAINERS file '$file': $!\n";
 357    my $i = 1;
 358    while (<$maint>) {
 359	my $line = $_;
 360	chomp $line;
 361
 362	if ($line =~ m/^([A-Z]):\s*(.*)/) {
 363	    my $type = $1;
 364	    my $value = $2;
 365
 366	    ##Filename pattern matching
 367	    if ($type eq "F" || $type eq "X") {
 368		$value =~ s@\.@\\\.@g;       ##Convert . to \.
 369		$value =~ s/\*/\.\*/g;       ##Convert * to .*
 370		$value =~ s/\?/\./g;         ##Convert ? to .
 371		##if pattern is a directory and it lacks a trailing slash, add one
 372		if ((-d $value)) {
 373		    $value =~ s@([^/])$@$1/@;
 374		}
 375	    } elsif ($type eq "K") {
 376		$keyword_hash{@typevalue} = $value;
 377	    }
 378	    push(@typevalue, "$type:$value");
 379	} elsif (!(/^\s*$/ || /^\s*\#/)) {
 380	    push(@typevalue, $line);
 381	}
 382	if (defined $self_test) {
 383	    push(@self_test_info, {file=>$file, linenr=>$i, line=>$line});
 384	}
 385	$i++;
 386    }
 387    close($maint);
 388}
 389
 390sub find_is_maintainer_file {
 391    my ($file) = $_;
 392    return if ($file !~ m@/MAINTAINERS$@);
 393    $file = $File::Find::name;
 394    return if (! -f $file);
 395    push(@mfiles, $file);
 396}
 397
 398sub find_ignore_git {
 399    return grep { $_ !~ /^\.git$/; } @_;
 400}
 401
 402read_all_maintainer_files();
 403
 404sub read_all_maintainer_files {
 405    my $path = "${lk_path}MAINTAINERS";
 406    if (defined $maintainer_path) {
 407	$path = $maintainer_path;
 408	# Perl Cookbook tilde expansion if necessary
 409	$path =~ s@^~([^/]*)@ $1 ? (getpwnam($1))[7] : ( $ENV{HOME} || $ENV{LOGDIR} || (getpwuid($<))[7])@ex;
 410    }
 411
 412    if (-d $path) {
 413	$path .= '/' if ($path !~ m@/$@);
 414	if ($find_maintainer_files) {
 415	    find( { wanted => \&find_is_maintainer_file,
 416		    preprocess => \&find_ignore_git,
 417		    no_chdir => 1,
 418		}, "$path");
 419	} else {
 420	    opendir(DIR, "$path") or die $!;
 421	    my @files = readdir(DIR);
 422	    closedir(DIR);
 423	    foreach my $file (@files) {
 424		push(@mfiles, "$path$file") if ($file !~ /^\./);
 425	    }
 
 
 426	}
 427    } elsif (-f "$path") {
 428	push(@mfiles, "$path");
 429    } else {
 430	die "$P: MAINTAINER file not found '$path'\n";
 431    }
 432    die "$P: No MAINTAINER files found in '$path'\n" if (scalar(@mfiles) == 0);
 433    foreach my $file (@mfiles) {
 434	read_maintainer_file("$file");
 435    }
 436}
 
 437
 438sub maintainers_in_file {
 439    my ($file) = @_;
 440
 441    return if ($file =~ m@\bMAINTAINERS$@);
 442
 443    if (-f $file && ($email_file_emails || $file =~ /\.yaml$/)) {
 444	open(my $f, '<', $file)
 445	    or die "$P: Can't open $file: $!\n";
 446	my $text = do { local($/) ; <$f> };
 447	close($f);
 448
 449	my @poss_addr = $text =~ m$[\p{L}\"\' \,\.\+-]*\s*[\,]*\s*[\(\<\{]{0,1}[A-Za-z0-9_\.\+-]+\@[A-Za-z0-9\.-]+\.[A-Za-z0-9]+[\)\>\}]{0,1}$g;
 450	push(@file_emails, clean_file_emails(@poss_addr));
 451    }
 452}
 453
 454#
 455# Read mail address map
 456#
 457
 458my $mailmap;
 459
 460read_mailmap();
 461
 462sub read_mailmap {
 463    $mailmap = {
 464	names => {},
 465	addresses => {}
 466    };
 467
 468    return if (!$email_use_mailmap || !(-f "${lk_path}.mailmap"));
 469
 470    open(my $mailmap_file, '<', "${lk_path}.mailmap")
 471	or warn "$P: Can't open .mailmap: $!\n";
 472
 473    while (<$mailmap_file>) {
 474	s/#.*$//; #strip comments
 475	s/^\s+|\s+$//g; #trim
 476
 477	next if (/^\s*$/); #skip empty lines
 478	#entries have one of the following formats:
 479	# name1 <mail1>
 480	# <mail1> <mail2>
 481	# name1 <mail1> <mail2>
 482	# name1 <mail1> name2 <mail2>
 483	# (see man git-shortlog)
 484
 485	if (/^([^<]+)<([^>]+)>$/) {
 486	    my $real_name = $1;
 487	    my $address = $2;
 488
 489	    $real_name =~ s/\s+$//;
 490	    ($real_name, $address) = parse_email("$real_name <$address>");
 491	    $mailmap->{names}->{$address} = $real_name;
 492
 493	} elsif (/^<([^>]+)>\s*<([^>]+)>$/) {
 494	    my $real_address = $1;
 495	    my $wrong_address = $2;
 496
 497	    $mailmap->{addresses}->{$wrong_address} = $real_address;
 498
 499	} elsif (/^(.+)<([^>]+)>\s*<([^>]+)>$/) {
 500	    my $real_name = $1;
 501	    my $real_address = $2;
 502	    my $wrong_address = $3;
 503
 504	    $real_name =~ s/\s+$//;
 505	    ($real_name, $real_address) =
 506		parse_email("$real_name <$real_address>");
 507	    $mailmap->{names}->{$wrong_address} = $real_name;
 508	    $mailmap->{addresses}->{$wrong_address} = $real_address;
 509
 510	} elsif (/^(.+)<([^>]+)>\s*(.+)\s*<([^>]+)>$/) {
 511	    my $real_name = $1;
 512	    my $real_address = $2;
 513	    my $wrong_name = $3;
 514	    my $wrong_address = $4;
 515
 516	    $real_name =~ s/\s+$//;
 517	    ($real_name, $real_address) =
 518		parse_email("$real_name <$real_address>");
 519
 520	    $wrong_name =~ s/\s+$//;
 521	    ($wrong_name, $wrong_address) =
 522		parse_email("$wrong_name <$wrong_address>");
 523
 524	    my $wrong_email = format_email($wrong_name, $wrong_address, 1);
 525	    $mailmap->{names}->{$wrong_email} = $real_name;
 526	    $mailmap->{addresses}->{$wrong_email} = $real_address;
 527	}
 528    }
 529    close($mailmap_file);
 530}
 531
 532## use the filenames on the command line or find the filenames in the patchfiles
 533
 
 
 
 
 
 534if (!@ARGV) {
 535    push(@ARGV, "&STDIN");
 536}
 537
 538foreach my $file (@ARGV) {
 539    if ($file ne "&STDIN") {
 540	$file = canonpath($file);
 541	##if $file is a directory and it lacks a trailing slash, add one
 542	if ((-d $file)) {
 543	    $file =~ s@([^/])$@$1/@;
 544	} elsif (!(-f $file)) {
 545	    die "$P: file '${file}' not found\n";
 546	}
 547    }
 548    if ($from_filename && (vcs_exists() && !vcs_file_exists($file))) {
 549	warn "$P: file '$file' not found in version control $!\n";
 550    }
 551    if ($from_filename || ($file ne "&STDIN" && vcs_file_exists($file))) {
 552	$file =~ s/^\Q${cur_path}\E//;	#strip any absolute path
 553	$file =~ s/^\Q${lk_path}\E//;	#or the path to the lk tree
 554	push(@files, $file);
 555	if ($file ne "MAINTAINERS" && -f $file && $keywords && $keywords_in_file) {
 556	    open(my $f, '<', $file)
 557		or die "$P: Can't open $file: $!\n";
 558	    my $text = do { local($/) ; <$f> };
 559	    close($f);
 560	    foreach my $line (keys %keyword_hash) {
 561		if ($text =~ m/$keyword_hash{$line}/x) {
 562		    push(@keyword_tvi, $line);
 
 
 563		}
 564	    }
 
 
 
 
 565	}
 566    } else {
 567	my $file_cnt = @files;
 568	my $lastfile;
 569
 570	open(my $patch, "< $file")
 571	    or die "$P: Can't open $file: $!\n";
 572
 573	# We can check arbitrary information before the patch
 574	# like the commit message, mail headers, etc...
 575	# This allows us to match arbitrary keywords against any part
 576	# of a git format-patch generated file (subject tags, etc...)
 577
 578	my $patch_prefix = "";			#Parsing the intro
 579
 580	while (<$patch>) {
 581	    my $patch_line = $_;
 582	    if (m/^ mode change [0-7]+ => [0-7]+ (\S+)\s*$/) {
 583		my $filename = $1;
 584		push(@files, $filename);
 585	    } elsif (m/^rename (?:from|to) (\S+)\s*$/) {
 586		my $filename = $1;
 587		push(@files, $filename);
 588	    } elsif (m/^diff --git a\/(\S+) b\/(\S+)\s*$/) {
 589		my $filename1 = $1;
 590		my $filename2 = $2;
 591		push(@files, $filename1);
 592		push(@files, $filename2);
 593	    } elsif (m/^Fixes:\s+([0-9a-fA-F]{6,40})/) {
 594		push(@fixes, $1) if ($email_fixes);
 595	    } elsif (m/^\+\+\+\s+(\S+)/ or m/^---\s+(\S+)/) {
 596		my $filename = $1;
 597		$filename =~ s@^[^/]*/@@;
 598		$filename =~ s@\n@@;
 599		$lastfile = $filename;
 600		push(@files, $filename);
 601		$patch_prefix = "^[+-].*";	#Now parsing the actual patch
 602	    } elsif (m/^\@\@ -(\d+),(\d+)/) {
 603		if ($email_git_blame) {
 604		    push(@range, "$lastfile:$1:$2");
 605		}
 606	    } elsif ($keywords) {
 607		foreach my $line (keys %keyword_hash) {
 608		    if ($patch_line =~ m/${patch_prefix}$keyword_hash{$line}/x) {
 609			push(@keyword_tvi, $line);
 610		    }
 611		}
 612	    }
 613	}
 614	close($patch);
 615
 616	if ($file_cnt == @files) {
 617	    warn "$P: file '${file}' doesn't appear to be a patch.  "
 618		. "Add -f to options?\n";
 619	}
 620	@files = sort_and_uniq(@files);
 621    }
 622}
 623
 624@file_emails = uniq(@file_emails);
 625@fixes = uniq(@fixes);
 626
 627my %email_hash_name;
 628my %email_hash_address;
 629my @email_to = ();
 630my %hash_list_to;
 631my @list_to = ();
 632my @scm = ();
 633my @web = ();
 634my @subsystem = ();
 635my @status = ();
 636my %deduplicate_name_hash = ();
 637my %deduplicate_address_hash = ();
 638
 639my @maintainers = get_maintainers();
 
 640if (@maintainers) {
 641    @maintainers = merge_email(@maintainers);
 642    output(@maintainers);
 643}
 644
 645if ($scm) {
 646    @scm = uniq(@scm);
 647    output(@scm);
 648}
 649
 650if ($status) {
 651    @status = uniq(@status);
 652    output(@status);
 653}
 654
 655if ($subsystem) {
 656    @subsystem = uniq(@subsystem);
 657    output(@subsystem);
 658}
 659
 660if ($web) {
 661    @web = uniq(@web);
 662    output(@web);
 663}
 664
 665exit($exit);
 666
 667sub self_test {
 668    my @lsfiles = ();
 669    my @good_links = ();
 670    my @bad_links = ();
 671    my @section_headers = ();
 672    my $index = 0;
 673
 674    @lsfiles = vcs_list_files($lk_path);
 675
 676    for my $x (@self_test_info) {
 677	$index++;
 678
 679	## Section header duplication and missing section content
 680	if (($self_test eq "" || $self_test =~ /\bsections\b/) &&
 681	    $x->{line} =~ /^\S[^:]/ &&
 682	    defined $self_test_info[$index] &&
 683	    $self_test_info[$index]->{line} =~ /^([A-Z]):\s*\S/) {
 684	    my $has_S = 0;
 685	    my $has_F = 0;
 686	    my $has_ML = 0;
 687	    my $status = "";
 688	    if (grep(m@^\Q$x->{line}\E@, @section_headers)) {
 689		print("$x->{file}:$x->{linenr}: warning: duplicate section header\t$x->{line}\n");
 690	    } else {
 691		push(@section_headers, $x->{line});
 692	    }
 693	    my $nextline = $index;
 694	    while (defined $self_test_info[$nextline] &&
 695		   $self_test_info[$nextline]->{line} =~ /^([A-Z]):\s*(\S.*)/) {
 696		my $type = $1;
 697		my $value = $2;
 698		if ($type eq "S") {
 699		    $has_S = 1;
 700		    $status = $value;
 701		} elsif ($type eq "F" || $type eq "N") {
 702		    $has_F = 1;
 703		} elsif ($type eq "M" || $type eq "R" || $type eq "L") {
 704		    $has_ML = 1;
 705		}
 706		$nextline++;
 707	    }
 708	    if (!$has_ML && $status !~ /orphan|obsolete/i) {
 709		print("$x->{file}:$x->{linenr}: warning: section without email address\t$x->{line}\n");
 710	    }
 711	    if (!$has_S) {
 712		print("$x->{file}:$x->{linenr}: warning: section without status \t$x->{line}\n");
 713	    }
 714	    if (!$has_F) {
 715		print("$x->{file}:$x->{linenr}: warning: section without file pattern\t$x->{line}\n");
 716	    }
 717	}
 718
 719	next if ($x->{line} !~ /^([A-Z]):\s*(.*)/);
 720
 721	my $type = $1;
 722	my $value = $2;
 723
 724	## Filename pattern matching
 725	if (($type eq "F" || $type eq "X") &&
 726	    ($self_test eq "" || $self_test =~ /\bpatterns\b/)) {
 727	    $value =~ s@\.@\\\.@g;       ##Convert . to \.
 728	    $value =~ s/\*/\.\*/g;       ##Convert * to .*
 729	    $value =~ s/\?/\./g;         ##Convert ? to .
 730	    ##if pattern is a directory and it lacks a trailing slash, add one
 731	    if ((-d $value)) {
 732		$value =~ s@([^/])$@$1/@;
 733	    }
 734	    if (!grep(m@^$value@, @lsfiles)) {
 735		print("$x->{file}:$x->{linenr}: warning: no file matches\t$x->{line}\n");
 736	    }
 737
 738	## Link reachability
 739	} elsif (($type eq "W" || $type eq "Q" || $type eq "B") &&
 740		 $value =~ /^https?:/ &&
 741		 ($self_test eq "" || $self_test =~ /\blinks\b/)) {
 742	    next if (grep(m@^\Q$value\E$@, @good_links));
 743	    my $isbad = 0;
 744	    if (grep(m@^\Q$value\E$@, @bad_links)) {
 745	        $isbad = 1;
 746	    } else {
 747		my $output = `wget --spider -q --no-check-certificate --timeout 10 --tries 1 $value`;
 748		if ($? == 0) {
 749		    push(@good_links, $value);
 750		} else {
 751		    push(@bad_links, $value);
 752		    $isbad = 1;
 753		}
 754	    }
 755	    if ($isbad) {
 756	        print("$x->{file}:$x->{linenr}: warning: possible bad link\t$x->{line}\n");
 757	    }
 758
 759	## SCM reachability
 760	} elsif ($type eq "T" &&
 761		 ($self_test eq "" || $self_test =~ /\bscm\b/)) {
 762	    next if (grep(m@^\Q$value\E$@, @good_links));
 763	    my $isbad = 0;
 764	    if (grep(m@^\Q$value\E$@, @bad_links)) {
 765	        $isbad = 1;
 766            } elsif ($value !~ /^(?:git|quilt|hg)\s+\S/) {
 767		print("$x->{file}:$x->{linenr}: warning: malformed entry\t$x->{line}\n");
 768	    } elsif ($value =~ /^git\s+(\S+)(\s+([^\(]+\S+))?/) {
 769		my $url = $1;
 770		my $branch = "";
 771		$branch = $3 if $3;
 772		my $output = `git ls-remote --exit-code -h "$url" $branch > /dev/null 2>&1`;
 773		if ($? == 0) {
 774		    push(@good_links, $value);
 775		} else {
 776		    push(@bad_links, $value);
 777		    $isbad = 1;
 778		}
 779	    } elsif ($value =~ /^(?:quilt|hg)\s+(https?:\S+)/) {
 780		my $url = $1;
 781		my $output = `wget --spider -q --no-check-certificate --timeout 10 --tries 1 $url`;
 782		if ($? == 0) {
 783		    push(@good_links, $value);
 784		} else {
 785		    push(@bad_links, $value);
 786		    $isbad = 1;
 787		}
 788	    }
 789	    if ($isbad) {
 790		print("$x->{file}:$x->{linenr}: warning: possible bad link\t$x->{line}\n");
 791	    }
 792	}
 793    }
 794}
 795
 796sub ignore_email_address {
 797    my ($address) = @_;
 798
 799    foreach my $ignore (@ignore_emails) {
 800	return 1 if ($ignore eq $address);
 801    }
 802
 803    return 0;
 804}
 805
 806sub range_is_maintained {
 807    my ($start, $end) = @_;
 808
 809    for (my $i = $start; $i < $end; $i++) {
 810	my $line = $typevalue[$i];
 811	if ($line =~ m/^([A-Z]):\s*(.*)/) {
 812	    my $type = $1;
 813	    my $value = $2;
 814	    if ($type eq 'S') {
 815		if ($value =~ /(maintain|support)/i) {
 816		    return 1;
 817		}
 818	    }
 819	}
 820    }
 821    return 0;
 822}
 823
 824sub range_has_maintainer {
 825    my ($start, $end) = @_;
 826
 827    for (my $i = $start; $i < $end; $i++) {
 828	my $line = $typevalue[$i];
 829	if ($line =~ m/^([A-Z]):\s*(.*)/) {
 830	    my $type = $1;
 831	    my $value = $2;
 832	    if ($type eq 'M') {
 833		return 1;
 834	    }
 835	}
 836    }
 837    return 0;
 838}
 839
 840sub get_maintainers {
 841    %email_hash_name = ();
 842    %email_hash_address = ();
 843    %commit_author_hash = ();
 844    %commit_signer_hash = ();
 845    @email_to = ();
 846    %hash_list_to = ();
 847    @list_to = ();
 848    @scm = ();
 849    @web = ();
 850    @subsystem = ();
 851    @status = ();
 852    %deduplicate_name_hash = ();
 853    %deduplicate_address_hash = ();
 854    if ($email_git_all_signature_types) {
 855	$signature_pattern = "(.+?)[Bb][Yy]:";
 856    } else {
 857	$signature_pattern = "\(" . join("|", @signature_tags) . "\)";
 858    }
 859
 860    # Find responsible parties
 861
 862    my %exact_pattern_match_hash = ();
 863
 864    foreach my $file (@files) {
 865
 866	my %hash;
 867	my $tvi = find_first_section();
 868	while ($tvi < @typevalue) {
 869	    my $start = find_starting_index($tvi);
 870	    my $end = find_ending_index($tvi);
 871	    my $exclude = 0;
 872	    my $i;
 873
 874	    #Do not match excluded file patterns
 875
 876	    for ($i = $start; $i < $end; $i++) {
 877		my $line = $typevalue[$i];
 878		if ($line =~ m/^([A-Z]):\s*(.*)/) {
 879		    my $type = $1;
 880		    my $value = $2;
 881		    if ($type eq 'X') {
 882			if (file_match_pattern($file, $value)) {
 883			    $exclude = 1;
 884			    last;
 885			}
 886		    }
 887		}
 888	    }
 889
 890	    if (!$exclude) {
 891		for ($i = $start; $i < $end; $i++) {
 892		    my $line = $typevalue[$i];
 893		    if ($line =~ m/^([A-Z]):\s*(.*)/) {
 894			my $type = $1;
 895			my $value = $2;
 896			if ($type eq 'F') {
 897			    if (file_match_pattern($file, $value)) {
 898				my $value_pd = ($value =~ tr@/@@);
 899				my $file_pd = ($file  =~ tr@/@@);
 900				$value_pd++ if (substr($value,-1,1) ne "/");
 901				$value_pd = -1 if ($value =~ /^\.\*/);
 902				if ($value_pd >= $file_pd &&
 903				    range_is_maintained($start, $end) &&
 904				    range_has_maintainer($start, $end)) {
 905				    $exact_pattern_match_hash{$file} = 1;
 906				}
 907				if ($pattern_depth == 0 ||
 908				    (($file_pd - $value_pd) < $pattern_depth)) {
 909				    $hash{$tvi} = $value_pd;
 910				}
 911			    }
 912			} elsif ($type eq 'N') {
 913			    if ($file =~ m/$value/x) {
 914				$hash{$tvi} = 0;
 915			    }
 916			}
 917		    }
 918		}
 919	    }
 920	    $tvi = $end + 1;
 921	}
 922
 923	foreach my $line (sort {$hash{$b} <=> $hash{$a}} keys %hash) {
 924	    add_categories($line, "");
 925	    if ($sections) {
 926		my $i;
 927		my $start = find_starting_index($line);
 928		my $end = find_ending_index($line);
 929		for ($i = $start; $i < $end; $i++) {
 930		    my $line = $typevalue[$i];
 931		    if ($line =~ /^[FX]:/) {		##Restore file patterns
 932			$line =~ s/([^\\])\.([^\*])/$1\?$2/g;
 933			$line =~ s/([^\\])\.$/$1\?/g;	##Convert . back to ?
 934			$line =~ s/\\\./\./g;       	##Convert \. to .
 935			$line =~ s/\.\*/\*/g;       	##Convert .* to *
 936		    }
 937		    my $count = $line =~ s/^([A-Z]):/$1:\t/g;
 938		    if ($letters eq "" || (!$count || $letters =~ /$1/i)) {
 939			print("$line\n");
 940		    }
 941		}
 942		print("\n");
 943	    }
 944	}
 945
 946	maintainers_in_file($file);
 947    }
 948
 949    if ($keywords) {
 950	@keyword_tvi = sort_and_uniq(@keyword_tvi);
 951	foreach my $line (@keyword_tvi) {
 952	    add_categories($line, ":Keyword:$keyword_hash{$line}");
 953	}
 954    }
 955
 956    foreach my $email (@email_to, @list_to) {
 957	$email->[0] = deduplicate_email($email->[0]);
 958    }
 959
 960    foreach my $file (@files) {
 961	if ($email &&
 962	    ($email_git ||
 963	     ($email_git_fallback &&
 964	      $file !~ /MAINTAINERS$/ &&
 965	      !$exact_pattern_match_hash{$file}))) {
 966	    vcs_file_signoffs($file);
 967	}
 968	if ($email && $email_git_blame) {
 969	    vcs_file_blame($file);
 970	}
 971    }
 972
 973    if ($email) {
 974	foreach my $chief (@penguin_chief) {
 975	    if ($chief =~ m/^(.*):(.*)/) {
 976		my $email_address;
 977
 978		$email_address = format_email($1, $2, $email_usename);
 979		if ($email_git_penguin_chiefs) {
 980		    push(@email_to, [$email_address, 'chief penguin']);
 981		} else {
 982		    @email_to = grep($_->[0] !~ /${email_address}/, @email_to);
 983		}
 984	    }
 985	}
 986
 987	foreach my $email (@file_emails) {
 988	    $email = mailmap_email($email);
 989	    my ($name, $address) = parse_email($email);
 990
 991	    my $tmp_email = format_email($name, $address, $email_usename);
 992	    push_email_address($tmp_email, '');
 993	    add_role($tmp_email, 'in file');
 994	}
 995    }
 996
 997    foreach my $fix (@fixes) {
 998	vcs_add_commit_signers($fix, "blamed_fixes");
 999    }
1000
1001    my @to = ();
1002    if ($email || $email_list) {
1003	if ($email) {
1004	    @to = (@to, @email_to);
1005	}
1006	if ($email_list) {
1007	    @to = (@to, @list_to);
1008	}
1009    }
1010
1011    if ($interactive) {
1012	@to = interactive_get_maintainers(\@to);
1013    }
1014
1015    return @to;
1016}
1017
# Return 1 when $file matches the MAINTAINERS pattern $pattern (already
# converted to a regexp, anchored here at the start of the name), else 0.
# A pattern ending in "/" matches everything below that directory; any
# other pattern only matches files with the same number of "/" separators
# as the pattern itself.
sub file_match_pattern {
    my ($file, $pattern) = @_;

    return 0 if ($file !~ m@^$pattern@);
    return 1 if (substr($pattern, -1) eq "/");

    my $file_slashes = ($file =~ tr@/@@);
    my $pattern_slashes = ($pattern =~ tr@/@@);
    return ($file_slashes == $pattern_slashes) ? 1 : 0;
}
1035
# Print the command line help text to the currently selected output handle.
# The text interpolates the program name, version and current option
# defaults at the time of the call.
sub usage {
    my $help_text = <<EOT;
usage: $P [options] patchfile
       $P [options] -f file|directory
version: $V

MAINTAINER field selection options:
  --email => print email address(es) if any
    --git => include recent git \*-by: signers
    --git-all-signature-types => include signers regardless of signature type
        or use only ${signature_pattern} signers (default: $email_git_all_signature_types)
    --git-fallback => use git when no exact MAINTAINERS pattern (default: $email_git_fallback)
    --git-chief-penguins => include ${penguin_chiefs}
    --git-min-signatures => number of signatures required (default: $email_git_min_signatures)
    --git-max-maintainers => maximum maintainers to add (default: $email_git_max_maintainers)
    --git-min-percent => minimum percentage of commits required (default: $email_git_min_percent)
    --git-blame => use git blame to find modified commits for patch or file
    --git-blame-signatures => when used with --git-blame, also include all commit signers
    --git-since => git history to use (default: $email_git_since)
    --hg-since => hg history to use (default: $email_hg_since)
    --interactive => display a menu (mostly useful if used with the --git option)
    --m => include maintainer(s) if any
    --r => include reviewer(s) if any
    --n => include name 'Full Name <addr\@domain.tld>'
    --l => include list(s) if any
    --moderated => include moderated lists(s) if any (default: true)
    --s => include subscriber only list(s) if any (default: false)
    --remove-duplicates => minimize duplicate email names/addresses
    --roles => show roles (status:subsystem, git-signer, list, etc...)
    --rolestats => show roles and statistics (commits/total_commits, %)
    --file-emails => add email addresses found in -f file (default: 0 (off))
    --fixes => for patches, add signatures of commits with 'Fixes: <commit>' (default: 1 (on))
  --scm => print SCM tree(s) if any
  --status => print status if any
  --subsystem => print subsystem name if any
  --web => print website(s) if any

Output type options:
  --separator [, ] => separator for multiple entries on 1 line
    using --separator also sets --nomultiline if --separator is not [, ]
  --multiline => print 1 entry per line

Other options:
  --pattern-depth => Number of pattern directory traversals (default: 0 (all))
  --keywords => scan patch for keywords (default: $keywords)
  --keywords-in-file => scan file for keywords (default: $keywords_in_file)
  --sections => print all of the subsystem sections with pattern matches
  --letters => print all matching 'letter' types from all matching sections
  --mailmap => use .mailmap file (default: $email_use_mailmap)
  --no-tree => run without a kernel tree
  --self-test => show potential issues with MAINTAINERS file content
  --version => show version
  --help => show this help information

Default options:
  [--email --tree --nogit --git-fallback --m --r --n --l --multiline
   --pattern-depth=0 --remove-duplicates --rolestats --keywords]

Notes:
  Using "-f directory" may give unexpected results:
      Used with "--git", git signators for _all_ files in and below
          directory are examined as git recurses directories.
          Any specified X: (exclude) pattern matches are _not_ ignored.
      Used with "--nogit", directory is used as a pattern match,
          no individual file within the directory or subdirectory
          is matched.
      Used with "--git-blame", does not iterate all files in directory
  Using "--git-blame" is slow and may add old committers and authors
      that are no longer active maintainers to the output.
  Using "--roles" or "--rolestats" with git send-email --cc-cmd or any
      other automated tools that expect only ["name"] <email address>
      may not work because of additional output after <email address>.
  Using "--rolestats" and "--git-blame" shows the #/total=% commits,
      not the percentage of the entire file authored.  # of commits is
      not a good measure of amount of code authored.  1 major commit may
      contain a thousand lines, 5 trivial commits may modify a single line.
  If git is not installed, but mercurial (hg) is installed and an .hg
      repository exists, the following options apply to mercurial:
          --git,
          --git-min-signatures, --git-max-maintainers, --git-min-percent, and
          --git-blame
      Use --hg-since not --git-since to control date selection
  File ".get_maintainer.conf", if it exists in the linux kernel source root
      directory, can change whatever get_maintainer defaults are desired.
      Entries in this file can be any command line argument.
      This file is prepended to any additional command line arguments.
      Multiple lines and # comments are allowed.
  Most options have both positive and negative forms.
      The negative forms for --<foo> are --no<foo> and --no-<foo>.

EOT

    print($help_text);
}
1128
# Return 1 when $lk_path looks like the top of a kernel source tree, i.e.
# it contains every expected top-level file and directory; 0 otherwise.
# A trailing "/" is appended to a non-empty path that lacks one.
sub top_of_kernel_tree {
    my ($lk_path) = @_;

    $lk_path .= "/" if ($lk_path ne "" && substr($lk_path, -1) ne "/");

    # These must be plain files ...
    foreach my $file (qw(COPYING CREDITS Kbuild Makefile README)) {
	return 0 if (!-f "${lk_path}${file}");
    }

    # ... MAINTAINERS only has to exist (any file type) ...
    return 0 if (!-e "${lk_path}MAINTAINERS");

    # ... and these must be directories.
    foreach my $dir (qw(Documentation arch include drivers fs
			init ipc kernel lib scripts)) {
	return 0 if (!-d "${lk_path}${dir}");
    }

    return 1;
}
1155
# Quote a display name for use in an email header when it needs it.
#
# Names made only of ASCII word characters, spaces and "-" are returned
# unchanged.  Anything else gets wrapped in double quotes, with embedded
# double quotes backslash-escaped unless they already are.
sub escape_name {
    my ($name) = @_;

    # Nothing outside the "safe" set: no quoting required.
    return $name unless ($name =~ /[^\w \-]/ai);

    $name =~ s/(?<!\\)"/\\"/g;       ##escape quotes

    return "\"$name\"";
}
1166
# Split a formatted email string into (name, address).
#
# Recognised shapes are "Name <user@host>", "<user@host>" and a bare
# "user@host"; anything else yields two empty strings.  The name is
# trimmed, stripped of one leading/trailing double quote and passed
# through escape_name(); the address is trimmed.
sub parse_email {
    my ($formatted_email) = @_;

    my ($name, $address) = ("", "");

    if ($formatted_email =~ /^([^<]+)<(.+\@.*)>.*$/) {
	($name, $address) = ($1, $2);
    } elsif ($formatted_email =~ /^\s*<(.+\@\S*)>.*$/ ||
	     $formatted_email =~ /^(.+\@\S*).*$/) {
	# $1 comes from whichever of the two alternatives matched.
	$address = $1;
    }

    $address =~ s/^\s+|\s+$//g;

    $name =~ s/^\s+|\s+$//g;
    $name =~ s/^\"|\"$//g;

    return (escape_name($name), $address);
}
1189
# Build the printable form of an email.
#
# Returns "name <address>" when $usename is true and the cleaned-up name is
# not empty; otherwise returns just the trimmed address.
sub format_email {
    my ($name, $address, $usename) = @_;

    $address =~ s/^\s+|\s+$//g;

    $name =~ s/^\s+|\s+$//g;
    $name =~ s/^\"|\"$//g;
    $name = escape_name($name);

    return $address if (!$usename || $name eq "");

    return "$name <$address>";
}
1212
# Return the index of the first @typevalue entry of the form "X: value"
# (a single capital letter followed by a colon), or the number of entries
# in @typevalue when there is none.
sub find_first_section {
    my $total = @typevalue;

    for (my $i = 0; $i < $total; $i++) {
	return $i if ($typevalue[$i] =~ m/^([A-Z]):\s*(.*)/);
    }

    return $total;
}
1226
# Walk backwards from $index over "X: value" entries of @typevalue and
# return the index of the first entry that is not of that form (or 0 when
# the start of the array is reached first).
sub find_starting_index {
    my ($index) = @_;

    $index--
	while ($index > 0 && $typevalue[$index] =~ m/^([A-Z]):\s*(.*)/);

    return $index;
}
1240
# Walk forwards from $index over "X: value" entries of @typevalue and
# return the index of the first entry that is not of that form (or the
# size of @typevalue when the end of the array is reached first).
sub find_ending_index {
    my ($index) = @_;

    $index++
	while ($index < @typevalue && $typevalue[$index] =~ m/^([A-Z]):\s*(.*)/);

    return $index;
}
1254
# Return the @typevalue entry found by find_starting_index($index), i.e.
# the heading line of the section containing $index.  When
# $output_section_maxlen is set and the heading is longer, it is cut to fit
# and terminated with "...".
sub get_subsystem_name {
    my ($index) = @_;

    my $subsystem = $typevalue[find_starting_index($index)];

    return $subsystem
	if (!$output_section_maxlen ||
	    length($subsystem) <= $output_section_maxlen);

    # Leave room for the three dots and drop whitespace left at the cut.
    $subsystem = substr($subsystem, 0, $output_section_maxlen - 3);
    $subsystem =~ s/\s*$//;

    return $subsystem . "...";
}
1268
# Return "role:subsystem" for the section containing $index.
#
# The role is derived from the last "S:" entry of the section (lower-cased);
# well-known status values are mapped to a person-style noun, any other
# value is used as is, and "unknown" is used when the section has no "S:".
sub get_maintainer_role {
    my ($index) = @_;

    my $start = find_starting_index($index);
    my $end = find_ending_index($index);
    my $subsystem = get_subsystem_name($index);

    my %role_for_status = (
	"supported"                 => "supporter",
	"maintained"                => "maintainer",
	"odd fixes"                 => "odd fixer",
	"orphan"                    => "orphan minder",
	"obsolete"                  => "obsolete minder",
	"buried alive in reporters" => "chief penguin",
    );

    my $role = "unknown";
    foreach my $i ($start + 1 .. $end - 1) {
	next if ($typevalue[$i] !~ m/^([A-Z]):\s*(.*)/);
	my ($ptype, $pvalue) = ($1, $2);
	$role = $pvalue if ($ptype eq "S");
    }

    $role = lc($role);
    $role = $role_for_status{$role} if (exists($role_for_status{$role}));

    return $role . ":" . $subsystem;
}
1307
# Return the subsystem name to show as a mailing list's role for the
# section containing $index; the catch-all "THE REST" section yields "".
sub get_list_role {
    my ($index) = @_;

    my $subsystem = get_subsystem_name($index);

    return ($subsystem eq "THE REST") ? "" : $subsystem;
}
1319
# Record everything the MAINTAINERS section containing $index contributes:
# the section heading goes to @subsystem, and each "X: value" entry is
# dispatched on its letter:
#   L  mailing list  -> @list_to (once per address, subject to the
#                       list/subscriber/moderated option flags)
#   M  maintainer    -> push_email_addresses() if $email_maintainer
#   R  reviewer      -> push_email_addresses() if $email_reviewer
#   T  SCM tree      -> @scm
#   W  web page      -> @web
#   S  status        -> @status
# $suffix is appended to every role/value that is recorded.
sub add_categories {
    my ($index, $suffix) = @_;

    my $start = find_starting_index($index);
    my $end = find_ending_index($index);

    push(@subsystem, $typevalue[$start]);

    foreach my $i ($start + 1 .. $end - 1) {
	next if ($typevalue[$i] !~ m/^([A-Z]):\s*(.*)/);
	my ($ptype, $pvalue) = ($1, $2);

	if ($ptype eq "L") {
	    my $list_role = get_list_role($i);
	    $list_role = ":" . $list_role if ($list_role ne "");

	    # "address free-form remarks" -> split off the remarks.
	    my ($list_address, $list_additional) = ($pvalue, "");
	    if ($pvalue =~ m/([^\s]+)\s+(.*)$/) {
		($list_address, $list_additional) = ($1, $2);
	    }

	    # Work out which kind of list this is; $kind stays undefined
	    # when the options say this kind must not be reported.
	    my $kind;
	    if ($list_additional =~ m/subscribers-only/) {
		$kind = "subscriber list" if ($email_subscriber_list);
	    } elsif ($email_list) {
		if ($list_additional =~ m/moderated/) {
		    $kind = "moderated list" if ($email_moderated_list);
		} else {
		    $kind = "open list";
		}
	    }

	    if (defined($kind) && !$hash_list_to{lc($list_address)}) {
		$hash_list_to{lc($list_address)} = 1;
		push(@list_to, [$list_address,
				"${kind}${list_role}" . $suffix]);
	    }
	} elsif ($ptype eq "M") {
	    push_email_addresses($pvalue, get_maintainer_role($i) . $suffix)
		if ($email_maintainer);
	} elsif ($ptype eq "R") {
	    if ($email_reviewer) {
		my $subsystem = get_subsystem_name($i);
		push_email_addresses($pvalue, "reviewer:$subsystem" . $suffix);
	    }
	} elsif ($ptype eq "T") {
	    push(@scm, $pvalue . $suffix);
	} elsif ($ptype eq "W") {
	    push(@web, $pvalue . $suffix);
	} elsif ($ptype eq "S") {
	    push(@status, $pvalue . $suffix);
	}
    }
}
1391
# Return 1 when this name/address pair must not be added again: both parts
# are empty, or the (case-insensitive) name or address has already been
# recorded in %email_hash_name / %email_hash_address.  Return 0 otherwise.
sub email_inuse {
    my ($name, $address) = @_;

    my $has_name = ($name ne "");
    my $has_address = ($address ne "");

    if (!$has_name && !$has_address) {
	return 1;
    }
    if ($has_name && exists($email_hash_name{lc($name)})) {
	return 1;
    }
    if ($has_address && exists($email_hash_address{lc($address)})) {
	return 1;
    }

    return 0;
}
1401
# Parse $line as an email and append it, with $role, to @email_to.
#
# Returns 0 when no address could be parsed, 1 otherwise.  With
# $email_remove_duplicates set, an entry whose name or address is already
# in use is silently skipped (still returning 1) and new entries are
# remembered in %email_hash_name / %email_hash_address.
sub push_email_address {
    my ($line, $role) = @_;

    my ($name, $address) = parse_email($line);
    return 0 if ($address eq "");

    if ($email_remove_duplicates) {
	return 1 if (email_inuse($name, $address));

	$email_hash_name{lc($name)}++ if ($name ne "");
	$email_hash_address{lc($address)}++;
    }

    push(@email_to, [format_email($name, $address, $email_usename), $role]);

    return 1;
}
1421
# Add one or several addresses taken from a MAINTAINERS entry.
#
# $address is first tried as a single RFC 822 address, then as an RFC 822
# address list; if neither validates it is still handed to
# push_email_address() and a warning is emitted when that fails too.
sub push_email_addresses {
    my ($address, $role) = @_;

    my @entries;

    if (rfc822_valid($address)) {
	push_email_address($address, $role);
    } elsif (@entries = rfc822_validlist($address)) {
	# The first element is discarded; the loop below only walks what
	# follows it and stops at the first false entry.
	shift(@entries);
	while (my $one = shift(@entries)) {
	    push_email_address($one, $role);
	}
    } else {
	if (!push_email_address($address, $role)) {
	    warn("Invalid MAINTAINERS address: '$address'\n");
	}
    }
}
1440
# Append $role to every @email_to entry that refers to the person in $line.
#
# With $email_remove_duplicates set, an entry refers to the same person when
# either its parsed name or its parsed address equals the one from $line;
# otherwise the formatted emails must be identical.  A non-empty role is
# only appended when the entry's role string does not already contain it.
#
# The containment test quotes $role with \Q...\E: a role is plain text, and
# interpolating it as a raw regex would let characters such as "(", "+" or
# "[" cause a false negative (duplicate role appended) or a regex
# compilation error.
sub add_role {
    my ($line, $role) = @_;

    my ($name, $address) = parse_email($line);
    my $email = format_email($name, $address, $email_usename);

    foreach my $entry (@email_to) {
	my $same_person;
	if ($email_remove_duplicates) {
	    my ($entry_name, $entry_address) = parse_email($entry->[0]);
	    $same_person = ($name eq $entry_name ||
			    $address eq $entry_address);
	} else {
	    $same_person = ($email eq $entry->[0]);
	}
	next if (!$same_person);

	# Role already listed for this entry: nothing to add.
	next if ($role ne "" && $entry->[1] =~ m/\Q$role\E/);

	$entry->[1] = ($entry->[1] eq "") ? "$role" : "$entry->[1],$role";
    }
}
1472
# Look $bin up in the directories of $ENV{PATH} and return the first
# "directory/bin" that exists, or "" when none does.
sub which {
    my ($bin) = @_;

    for my $dir (split(/:/, $ENV{PATH})) {
	my $candidate = "$dir/$bin";
	return $candidate if (-e $candidate);
    }

    return "";
}
1484
# Search ".", $ENV{HOME} and ".scripts" (in that order) for the file $conf
# and return the first "directory/conf" that exists, or "" when none does.
sub which_conf {
    my ($conf) = @_;

    for my $dir (split(/:/, ".:$ENV{HOME}:.scripts")) {
	my $candidate = "$dir/$conf";
	return $candidate if (-e $candidate);
    }

    return "";
}
1496
# Map one email through the $mailmap tables and return it formatted as
# "name <address>".
#
# The lookup key is the full formatted email when either table has an entry
# for it, and the bare address otherwise.  Whatever the chosen key maps to
# in {names} / {addresses} replaces the parsed name / address.
sub mailmap_email {
    my ($line) = @_;

    my ($name, $address) = parse_email($line);
    my $email = format_email($name, $address, 1);

    my $names = $mailmap->{names};
    my $addresses = $mailmap->{addresses};

    my $key = $address;
    if (exists $mailmap->{names}->{$email} ||
	exists $mailmap->{addresses}->{$email}) {
	$key = $email;
    }

    my $real_name = exists $mailmap->{names}->{$key}
	? $mailmap->{names}->{$key} : $name;
    my $real_address = exists $mailmap->{addresses}->{$key}
	? $mailmap->{addresses}->{$key} : $address;

    return format_email($real_name, $real_address, 1);
}
1523
# Run every given address through mailmap_email() and return the mapped
# list.  merge_by_realname() is additionally invoked on the result when
# $email_use_mailmap is set.
sub mailmap {
    my (@addresses) = @_;

    my @mapped_emails = map { mailmap_email($_) } @addresses;

    merge_by_realname(@mapped_emails) if ($email_use_mailmap);

    return @mapped_emails;
}
1534
# Make every email that shares a real name use the address first seen for
# that name.
#
# The arguments are rewritten in place: the elements of @_ alias the
# caller's variables, so calling merge_by_realname(@emails) updates @emails
# itself.  The previous implementation modified a private copy of @_ and
# returned nothing, which made the merge a silent no-op for the caller.
# The merged list is also returned for callers that prefer a value.
#
# Entries without a name are left alone; otherwise all bare addresses would
# be collapsed onto the first one.
sub merge_by_realname {
    my %address_map;

    foreach my $email (@_) {
	my ($name, $address) = parse_email($email);
	next if ($name eq "");

	if (exists $address_map{$name}) {
	    $email = format_email($name, $address_map{$name}, 1);
	} else {
	    $address_map{$name} = $address;
	}
    }

    return @_;
}
1549
# Run $cmd through the shell and return its standard output as a list of
# lines, with the leading whitespace of every line removed.
sub git_execute_cmd {
    my ($cmd) = @_;

    my $output = `$cmd`;
    $output =~ s/^\s*//gm;

    my @stripped_lines = split("\n", $output);

    return @stripped_lines;
}
1560
# Run $cmd through the shell and return its standard output as a list of
# lines, otherwise unmodified.
sub hg_execute_cmd {
    my ($cmd) = @_;

    my $output = `$cmd`;
    my @raw_lines = split("\n", $output);

    return @raw_lines;
}
1570
# Split "Type: Name <address>" style lines into their two halves.
#
# Returns two array references of equal length: the text before the colon
# of every line, and the text after it passed through deduplicate_email()
# so that badly written signatures come out in a uniform format.
sub extract_formatted_signatures {
    my (@signature_lines) = @_;

    my @types = ();
    my @signers = ();

    foreach my $line (@signature_lines) {
	(my $type = $line) =~ s/\s*(.*):.*/$1/;

	# cut -f2- -d":"
	(my $signer = $line) =~ s/\s*.*:\s*(.+)\s*/$1/;

	push(@types, $type);
	push(@signers, $signer);
    }

    ## Reformat email addresses (with names) to avoid badly written signatures
    @signers = map { deduplicate_email($_) } @signers;

    return (\@types, \@signers);
}
1589
# Run the VCS log command $cmd and pick the interesting lines out of it.
#
# Returns (commit count, \@signers, \@authors, \@stats).  When the output
# has no signature lines at all, the count is 0 and the raw (unformatted)
# signature/author lines are returned instead.
#
# NOTE: the parameter must stay named $file - the "stat_pattern" template is
# expanded with s///ee and refers to variables of this scope by name.
sub vcs_find_signers {
    my ($cmd, $file) = @_;

    my @lines = &{$VCS_cmds{"execute_cmd"}}($cmd);

    my $pattern = $VCS_cmds{"commit_pattern"};
    my $author_pattern = $VCS_cmds{"author_pattern"};
    my $stat_pattern = $VCS_cmds{"stat_pattern"};

    $stat_pattern =~ s/(\$\w+)/$1/eeg;		#interpolate $stat_pattern

    # grep in scalar context: number of commit header lines.
    my $commits = grep(/$pattern/, @lines);

    my @authors = grep(/$author_pattern/, @lines);
    my @signatures = grep(/^[ \t]*${signature_pattern}.*\@.*$/, @lines);
    my @stats = grep(/$stat_pattern/, @lines);

    return (0, \@signatures, \@authors, \@stats) if !@signatures;

    if ($interactive) {
	save_commits_by_author(@lines);
	save_commits_by_signer(@lines);
    }

    @signatures = grep(!/${penguin_chiefs}/i, @signatures)
	if (!$email_git_penguin_chiefs);

    # Only the second (formatted) half of each result is needed here.
    my (undef, $authors_ref) = extract_formatted_signatures(@authors);
    my (undef, $signers_ref) = extract_formatted_signatures(@signatures);

    return ($commits, $signers_ref, $authors_ref, \@stats);
}
1628
# Run the VCS command $cmd and return the authors found in its output,
# each formatted as "name <address>".  Lines matching ${penguin_chiefs} are
# dropped first unless $email_git_penguin_chiefs is set.
sub vcs_find_author {
    my ($cmd) = @_;

    my @lines = &{$VCS_cmds{"execute_cmd"}}($cmd);

    @lines = grep(!/${penguin_chiefs}/i, @lines)
	if (!$email_git_penguin_chiefs);

    return @lines if !@lines;

    my @authors = ();
    foreach my $line (@lines) {
	next unless ($line =~ m/$VCS_cmds{"author_pattern"}/);

	# Copy the capture before any other regex can clobber it.
	my $raw_author = $1;
	push(@authors, format_email(parse_email($raw_author), 1));
    }

    if ($interactive) {
	save_commits_by_author(@lines);
	save_commits_by_signer(@lines);
    }

    return @authors;
}
1656
# Run the VCS blame command $cmd and return, in output order, the first
# capture of "blame_commit_pattern" for every line that matches it.
sub vcs_save_commits {
    my ($cmd) = @_;

    my @lines = &{$VCS_cmds{"execute_cmd"}}($cmd);

    my @commits = ();
    foreach my $line (@lines) {
	next unless ($line =~ m/$VCS_cmds{"blame_commit_pattern"}/);
	push(@commits, $1);
    }

    return @commits;
}
1672
# Return the commits that "blame" attributes to $file.
#
# With @range entries ("file:start:length", taken from patch hunks) only the
# lines of those ranges are considered; without them the whole file is.
# Returns an empty list when $file is not a plain file.  A leading "^" is
# stripped from every commit id.
#
# NOTE: the names $file, $diff_start and $diff_length must not change - the
# command templates in %VCS_cmds are expanded with s///ee and refer to the
# variables of this scope by name.
sub vcs_blame {
    my ($file) = @_;
    my $cmd;
    my @commits = ();

    return @commits if (!(-f $file));

    if (@range && $VCS_cmds{"blame_range_cmd"} eq "") {
	# The VCS cannot blame a line range: blame the whole file once and
	# pick the wanted lines out of the result.
	$cmd = $VCS_cmds{"blame_file_cmd"};
	$cmd =~ s/(\$\w+)/$1/eeg;		#interpolate $cmd
	my @all_commits = vcs_save_commits($cmd);

	foreach my $file_range_diff (@range) {
	    next if (!($file_range_diff =~ m/(.+):(.+):(.+)/));
	    my $diff_file = $1;
	    my $diff_start = $2;
	    my $diff_length = $3;
	    next if ("$file" ne "$diff_file");

	    # Diff line numbers are 1-based while @all_commits is 0-based
	    # (assuming one blame entry per file line - TODO confirm for
	    # every blame_commit_pattern), so line N lives at index N - 1.
	    # Lines outside the blamed file are skipped instead of pushing
	    # undef.
	    for (my $line_nr = $diff_start;
		 $line_nr < $diff_start + $diff_length;
		 $line_nr++) {
		next if ($line_nr < 1 || $line_nr > @all_commits);
		push(@commits, $all_commits[$line_nr - 1]);
	    }
	}
    } elsif (@range) {
	foreach my $file_range_diff (@range) {
	    next if (!($file_range_diff =~ m/(.+):(.+):(.+)/));
	    my $diff_file = $1;
	    my $diff_start = $2;
	    my $diff_length = $3;
	    next if ("$file" ne "$diff_file");
	    $cmd = $VCS_cmds{"blame_range_cmd"};
	    $cmd =~ s/(\$\w+)/$1/eeg;		#interpolate $cmd
	    push(@commits, vcs_save_commits($cmd));
	}
    } else {
	$cmd = $VCS_cmds{"blame_file_cmd"};
	$cmd =~ s/(\$\w+)/$1/eeg;		#interpolate $cmd
	@commits = vcs_save_commits($cmd);
    }

    foreach my $commit (@commits) {
	$commit =~ s/^\^//g;
    }

    return @commits;
}
1720
# Set once the "no VCS" hint has been printed, so it is shown only once.
my $printed_novcs = 0;

# Select the version control system to use by loading its command table
# into %VCS_cmds.  Returns 1 when the git table's "available" check
# succeeds, 2 when the hg one does, and 0 (with %VCS_cmds emptied) when
# neither does.  In the last case a hint is printed once if --git was
# requested.
sub vcs_exists {
    my @candidates = ([1, \%VCS_cmds_git], [2, \%VCS_cmds_hg]);

    foreach my $candidate (@candidates) {
	my ($id, $cmds_ref) = @{$candidate};
	%VCS_cmds = %{$cmds_ref};
	return $id if eval $VCS_cmds{"available"};
    }
    %VCS_cmds = ();

    return 0 if ($printed_novcs || !$email_git);

    warn("$P: No supported VCS found.  Add --nogit to options?\n");
    warn("Using a git repository produces better results.\n");
    warn("Try Linus Torvalds' latest git repository using:\n");
    warn("git clone git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git\n");
    $printed_novcs = 1;

    return 0;
}
1737
# True when $vcs_used says git (value 1).  vcs_exists() is called first so
# that %VCS_cmds is (re)loaded as a side effect.
sub vcs_is_git {
    vcs_exists();

    my $using_git = ($vcs_used == 1);
    return $using_git;
}
1742
# True when $vcs_used says mercurial (value 2).
sub vcs_is_hg {
    my $using_hg = ($vcs_used == 2);
    return $using_hg;
}
1746
# Look up the signers of a single commit and hand them to vcs_assign()
# under the role description $desc.  Does nothing when no VCS is available.
#
# NOTE: the parameter must stay named $commit - the
# "find_commit_signers_cmd" template is expanded with s///ee and refers to
# variables of this scope by name.
sub vcs_add_commit_signers {
    return if (!vcs_exists());

    my ($commit, $desc) = @_;

    my $cmd = $VCS_cmds{"find_commit_signers_cmd"};
    $cmd =~ s/(\$\w+)/$1/eeg;	#substitute variables in $cmd

    # Only the signers are used; count, authors and stats are ignored.
    my (undef, $commit_signers_ref) = vcs_find_signers($cmd, "");

    my @commit_signers = ();
    @commit_signers = @{$commit_signers_ref} if defined $commit_signers_ref;

    @commit_signers = map { deduplicate_email($_) } @commit_signers;

    vcs_assign($desc, 1, @commit_signers);
}
1772
# Interactive menu: show the candidate recipients in @$list_ref on STDERR,
# read commands from STDIN and return the entries left selected.
#
# Each entry is [email, role].  Commands may be combined on one line,
# separated by commas or spaces.  Commands that change how recipients are
# computed re-enter get_maintainers() (via goto) after the whole input line
# has been processed.
#
# Fixes relative to the previous implementation:
#  - "t" alone toggles "all signature types" as the options menu promises;
#    that handler used to sit behind the earlier "t?" toggle branch and was
#    unreachable.
#  - Entry numbers are validated against the list size.  The old code reset
#    its counter on every pass and only recounted while redrawing, so after
#    an "invalid option" every number was rejected.
#  - End of input on STDIN is treated like "Y" (approve) instead of looping
#    forever on an undefined input line.
sub interactive_get_maintainers {
    my ($list_ref) = @_;
    my @list = @$list_ref;
    my $total = scalar(@list);

    vcs_exists();

    my %selected;
    my %authored;
    my %signed;
    my $maintained = 0;
    for (my $i = 0; $i < $total; $i++) {
	$maintained = 1 if ($list[$i]->[1] =~ /^(maintainer|supporter)/i);
	$selected{$i} = 1;
	$authored{$i} = 0;
	$signed{$i} = 0;
    }

    #menu loop
    my $done = 0;
    my $print_options = 0;
    my $redraw = 1;
    while (!$done) {
	if ($redraw) {
	    printf STDERR "\n%1s %2s %-65s",
			  "*", "#", "email/list and role:stats";
	    if ($email_git ||
		($email_git_fallback && !$maintained) ||
		$email_git_blame) {
		print STDERR "auth sign";
	    }
	    print STDERR "\n";
	    for (my $i = 0; $i < $total; $i++) {
		my $email = $list[$i]->[0];
		my $role = $list[$i]->[1];
		my $sel = $selected{$i} ? "*" : "";
		my $commit_author = $commit_author_hash{$email};
		my $commit_signer = $commit_signer_hash{$email};
		my $authored = 0;
		my $signed = 0;
		# Counting with a loop is deliberate: iterating tolerates an
		# undefined reference where a plain rvalue @{...} would die.
		$authored++ for (@{$commit_author});
		$signed++ for (@{$commit_signer});
		printf STDERR "%1s %2d %-65s", $sel, $i + 1, $email;
		printf STDERR "%4d %4d", $authored, $signed
		    if ($authored > 0 || $signed > 0);
		printf STDERR "\n     %s\n", $role;
		if ($authored{$i}) {
		    foreach my $ref (@{$commit_author}) {
			print STDERR "     Author: @{$ref}[1]\n";
		    }
		}
		if ($signed{$i}) {
		    foreach my $ref (@{$commit_signer}) {
			print STDERR "     @{$ref}[2]: @{$ref}[1]\n";
		    }
		}
	    }
	}
	my $date_ref = \$email_git_since;
	$date_ref = \$email_hg_since if (vcs_is_hg());
	if ($print_options) {
	    $print_options = 0;
	    if (vcs_exists()) {
		print STDERR <<EOT;

Version Control options:
g  use git history      [$email_git]
gf use git-fallback     [$email_git_fallback]
b  use git blame        [$email_git_blame]
bs use blame signatures [$email_git_blame_signatures]
c# minimum commits      [$email_git_min_signatures]
%# min percent          [$email_git_min_percent]
d# history to use       [$$date_ref]
x# max maintainers      [$email_git_max_maintainers]
t  all signature types  [$email_git_all_signature_types]
m  use .mailmap         [$email_use_mailmap]
EOT
	    }
	    print STDERR <<EOT;

Additional options:
0  toggle all
tm toggle maintainers
tg toggle git entries
tl toggle open list entries
ts toggle subscriber list entries
f  emails in file       [$email_file_emails]
k  keywords in file     [$keywords]
r  remove duplicates    [$email_remove_duplicates]
p# pattern match depth  [$pattern_depth]
EOT
	}
	print STDERR
"\n#(toggle), A#(author), S#(signed) *(all), ^(none), O(options), Y(approve): ";

	my $input = <STDIN>;
	if (!defined($input)) {
	    # End of input: nobody is left to answer, so accept the current
	    # selection exactly as "Y" would.
	    $interactive = 0;
	    $done = 1;
	    $output_rolestats = 0;
	    $output_roles = 0;
	    last;
	}
	chomp($input);

	$redraw = 1;
	my $rerun = 0;
	my @wish = split(/[, ]+/, $input);
	foreach my $nr (@wish) {
	    $nr = lc($nr);
	    my $sel = substr($nr, 0, 1);
	    my $str = substr($nr, 1);
	    my $val = 0;
	    $val = $1 if $str =~ /^(\d+)$/;

	    if ($sel eq "y") {
		$interactive = 0;
		$done = 1;
		$output_rolestats = 0;
		$output_roles = 0;
		last;
	    } elsif ($nr =~ /^\d+$/ && $nr > 0 && $nr <= $total) {
		$selected{$nr - 1} = !$selected{$nr - 1};
	    } elsif ($sel eq "*" || $sel eq '^') {
		my $toggle = 0;
		$toggle = 1 if ($sel eq '*');
		for (my $i = 0; $i < $total; $i++) {
		    $selected{$i} = $toggle;
		}
	    } elsif ($sel eq "0") {
		for (my $i = 0; $i < $total; $i++) {
		    $selected{$i} = !$selected{$i};
		}
	    } elsif ($sel eq "t") {
		if (lc($str) eq "m") {
		    for (my $i = 0; $i < $total; $i++) {
			$selected{$i} = !$selected{$i}
			    if ($list[$i]->[1] =~ /^(maintainer|supporter)/i);
		    }
		} elsif (lc($str) eq "g") {
		    for (my $i = 0; $i < $total; $i++) {
			$selected{$i} = !$selected{$i}
			    if ($list[$i]->[1] =~ /^(author|commit|signer)/i);
		    }
		} elsif (lc($str) eq "l") {
		    for (my $i = 0; $i < $total; $i++) {
			$selected{$i} = !$selected{$i}
			    if ($list[$i]->[1] =~ /^(open list)/i);
		    }
		} elsif (lc($str) eq "s") {
		    for (my $i = 0; $i < $total; $i++) {
			$selected{$i} = !$selected{$i}
			    if ($list[$i]->[1] =~ /^(subscriber list)/i);
		    }
		} elsif ($str eq "") {
		    # Plain "t": the "all signature types" switch.
		    bool_invert(\$email_git_all_signature_types);
		    $rerun = 1;
		}
	    } elsif ($sel eq "a") {
		if ($val > 0 && $val <= $total) {
		    $authored{$val - 1} = !$authored{$val - 1};
		} elsif ($str eq '*' || $str eq '^') {
		    my $toggle = 0;
		    $toggle = 1 if ($str eq '*');
		    for (my $i = 0; $i < $total; $i++) {
			$authored{$i} = $toggle;
		    }
		}
	    } elsif ($sel eq "s") {
		if ($val > 0 && $val <= $total) {
		    $signed{$val - 1} = !$signed{$val - 1};
		} elsif ($str eq '*' || $str eq '^') {
		    my $toggle = 0;
		    $toggle = 1 if ($str eq '*');
		    for (my $i = 0; $i < $total; $i++) {
			$signed{$i} = $toggle;
		    }
		}
	    } elsif ($sel eq "o") {
		$print_options = 1;
		$redraw = 1;
	    } elsif ($sel eq "g") {
		if ($str eq "f") {
		    bool_invert(\$email_git_fallback);
		} else {
		    bool_invert(\$email_git);
		}
		$rerun = 1;
	    } elsif ($sel eq "b") {
		if ($str eq "s") {
		    bool_invert(\$email_git_blame_signatures);
		} else {
		    bool_invert(\$email_git_blame);
		}
		$rerun = 1;
	    } elsif ($sel eq "c") {
		if ($val > 0) {
		    $email_git_min_signatures = $val;
		    $rerun = 1;
		}
	    } elsif ($sel eq "x") {
		if ($val > 0) {
		    $email_git_max_maintainers = $val;
		    $rerun = 1;
		}
	    } elsif ($sel eq "%") {
		if ($str ne "" && $val >= 0) {
		    $email_git_min_percent = $val;
		    $rerun = 1;
		}
	    } elsif ($sel eq "d") {
		if (vcs_is_git()) {
		    $email_git_since = $str;
		} elsif (vcs_is_hg()) {
		    $email_hg_since = $str;
		}
		$rerun = 1;
	    } elsif ($sel eq "f") {
		bool_invert(\$email_file_emails);
		$rerun = 1;
	    } elsif ($sel eq "r") {
		bool_invert(\$email_remove_duplicates);
		$rerun = 1;
	    } elsif ($sel eq "m") {
		bool_invert(\$email_use_mailmap);
		read_mailmap();
		$rerun = 1;
	    } elsif ($sel eq "k") {
		bool_invert(\$keywords);
		$rerun = 1;
	    } elsif ($sel eq "p") {
		if ($str ne "" && $val >= 0) {
		    $pattern_depth = $val;
		    $rerun = 1;
		}
	    } elsif ($sel eq "h" || $sel eq "?") {
		print STDERR <<EOT;

Interactive mode allows you to select the various maintainers, submitters,
commit signers and mailing lists that could be CC'd on a patch.

Any *'d entry is selected.

If you have git or hg installed, you can choose to summarize the commit
history of files in the patch.  Also, each line of the current file can
be matched to its commit author and that commits signers with blame.

Various knobs exist to control the length of time for active commit
tracking, the maximum number of commit authors and signers to add,
and such.

Enter selections at the prompt until you are satisfied that the selected
maintainers are appropriate.  You may enter multiple selections separated
by either commas or spaces.

EOT
	    } else {
		print STDERR "invalid option: '$nr'\n";
		$redraw = 0;
	    }
	}
	if ($rerun) {
	    print STDERR "git-blame can be very slow, please have patience..."
		if ($email_git_blame);
	    # Tail-call: recompute the whole list with the new settings.
	    goto &get_maintainers;
	}
    }

    #drop not selected entries
    my @new_emailto = ();
    for (my $i = 0; $i < $total; $i++) {
	push(@new_emailto, $list[$i]) if ($selected{$i});
    }
    return @new_emailto;
}
2052
# Flip the flag behind $bool_ref in place: any true value becomes 0, any
# false value becomes 1.
sub bool_invert {
    my ($bool_ref) = @_;

    $$bool_ref = $$bool_ref ? 0 : 1;
}
2062
# Normalise $email (parse, reformat, mailmap) and, when
# $email_remove_duplicates is set, replace it by the first name/address
# pair recorded for the same (case-insensitive) name or address.  A pair
# not seen before is recorded in %deduplicate_name_hash and
# %deduplicate_address_hash.  Returns the formatted, mailmapped result.
sub deduplicate_email {
    my ($email) = @_;

    $email = mailmap_email(format_email(parse_email($email), 1));

    return $email if (!$email_remove_duplicates);

    my ($name, $address) = parse_email($email);

    # A known name wins over a known address.
    my $known;
    if ($name ne "" && $deduplicate_name_hash{lc($name)}) {
	$known = $deduplicate_name_hash{lc($name)};
    } elsif ($deduplicate_address_hash{lc($address)}) {
	$known = $deduplicate_address_hash{lc($address)};
    }

    if ($known) {
	($name, $address) = ($known->[0], $known->[1]);
    } else {
	$deduplicate_name_hash{lc($name)} = [ $name, $address ];
	$deduplicate_address_hash{lc($address)} = [ $name, $address ];
    }

    return mailmap_email(format_email($name, $address, 1));
}
2092
# Record which commits each author wrote.
#   @lines - VCS log output lines
# Authors, commit ids and subjects are pulled out of the lines with the
# active %VCS_cmds patterns and paired up by position.  Every
# (commit, subject) pair not already stored for an author is appended to
# that author's list in %commit_author_hash.
sub save_commits_by_author {
    my (@lines) = @_;

    my (@authors, @commits, @subjects);

    foreach my $line (@lines) {
        if ($line =~ m/$VCS_cmds{"author_pattern"}/) {
            my $author = deduplicate_email($1);
            push(@authors, $author);
        }
        if ($line =~ m/$VCS_cmds{"commit_pattern"}/) {
            push(@commits, $1);
        }
        if ($line =~ m/$VCS_cmds{"subject_pattern"}/) {
            push(@subjects, $1);
        }
    }

    foreach my $idx (0 .. $#authors) {
        my $saved = ($commit_author_hash{$authors[$idx]} ||= []);
        my $already = grep {
            $_->[0] eq $commits[$idx] && $_->[1] eq $subjects[$idx]
        } @{$saved};

        push(@{$saved}, [ $commits[$idx], $subjects[$idx] ]) if (!$already);
    }
}
2125
# Record which commits each signer put a signature tag on.
#   @lines - VCS log output lines
# The most recent commit id and subject seen are carried forward; each
# following line that looks like a signature with an email address adds a
# (commit, subject, type) triple to that signer's list in
# %commit_signer_hash, unless the same triple is already there.
sub save_commits_by_signer {
    my (@lines) = @_;

    my ($commit, $subject) = ("", "");

    foreach my $line (@lines) {
        if ($line =~ m/$VCS_cmds{"commit_pattern"}/) {
            $commit = $1;
        }
        if ($line =~ m/$VCS_cmds{"subject_pattern"}/) {
            $subject = $1;
        }
        next if ($line !~ /^[ \t]*${signature_pattern}.*\@.*$/);

        my @signatures = ($line);
        my ($types_ref, $signers_ref) = extract_formatted_signatures(@signatures);

        my $type = $types_ref->[0];
        my $signer = deduplicate_email($signers_ref->[0]);

        my $saved = ($commit_signer_hash{$signer} ||= []);
        my $already = grep {
            $_->[0] eq $commit && $_->[1] eq $subject && $_->[2] eq $type
        } @{$saved};

        push(@{$saved}, [ $commit, $subject, $type ]) if (!$already);
    }
}
2162
# Turn a list of contributor addresses into ranked recipients.
#   $role    - role label attached to every accepted address
#   $divisor - total used to convert an occurrence count into a percentage
#              (a value <= 0 is reported with warn() and replaced by 1)
#   @lines   - one address per contribution, duplicates expected
# Addresses are run through mailmap(), counted, and visited from most to
# least frequent.  Ignored addresses are skipped; the walk ends at the first
# address that falls below $email_git_min_signatures or
# $email_git_min_percent, or once $email_git_max_maintainers is exceeded.
sub vcs_assign {
    my ($role, $divisor, @lines) = @_;

    return if (@lines <= 0);

    if ($divisor <= 0) {
        warn("Bad divisor in " . (caller(0))[3] . ": $divisor\n");
        $divisor = 1;
    }

    @lines = mailmap(@lines);

    return if (@lines <= 0);

    @lines = sort(@lines);

    # uniq -c
    my %tally;
    foreach my $entry (@lines) {
        $tally{$entry}++;
    }

    # sort -rn
    my @ranked = sort { $tally{$b} <=> $tally{$a} } keys %tally;

    my $accepted = 0;
    foreach my $line (@ranked) {
        my $sign_offs = $tally{$line};
        my $percent = $sign_offs * 100 / $divisor;
        if ($percent > 100) {
            $percent = 100;
        }

        next if (ignore_email_address($line));

        $accepted++;
        if ($sign_offs < $email_git_min_signatures ||
            $accepted > $email_git_max_maintainers ||
            $percent < $email_git_min_percent) {
            last;
        }

        push_email_address($line, '');

        my $label = $role;
        if ($output_rolestats) {
            my $fmt_percent = sprintf("%.0f", $percent);
            $label = "$role:$sign_offs/$divisor=$fmt_percent%";
        }
        add_role($line, $label);
    }
}
2205
# Credit the people found in a file's commit history.
#   $file - path to examine; the name must stay "$file" because the command
#           and stat templates are expanded by string eval and look it up
#           by name
# Does nothing when no VCS is available.  Otherwise signers are credited as
# "commit_signer" and authors as "authored"; when there is exactly one stat
# entry per author, added and removed line counts are also credited per
# author as "added_lines" / "removed_lines".
sub vcs_file_signoffs {
    my ($file) = @_;

    $vcs_used = vcs_exists();
    return if (!$vcs_used);

    my $cmd = $VCS_cmds{"find_signers_cmd"};
    $cmd =~ s/(\$\w+)/$1/eeg;		# interpolate $cmd

    my ($commits, $signers_ref, $authors_ref, $stats_ref) =
        vcs_find_signers($cmd, $file);

    my @signers = defined $signers_ref ? @{$signers_ref} : ();
    my @authors = defined $authors_ref ? @{$authors_ref} : ();
    my @stats = defined $stats_ref ? @{$stats_ref} : ();

    foreach my $signer (@signers) {
        $signer = deduplicate_email($signer);
    }

    vcs_assign("commit_signer", $commits, @signers);
    vcs_assign("authored", $commits, @authors);

    if ($#authors == $#stats) {
        my $stat_pattern = $VCS_cmds{"stat_pattern"};
        $stat_pattern =~ s/(\$\w+)/$1/eeg;	#interpolate $stat_pattern

        # Totals over every commit
        my ($added, $deleted) = (0, 0);
        foreach my $stat (@stats) {
            if ($stat =~ /$stat_pattern/) {
                $added += $1;
                $deleted += $2;
            }
        }

        my @tmp_authors = uniq(@authors);
        foreach my $author (@tmp_authors) {
            $author = deduplicate_email($author);
        }
        @tmp_authors = uniq(@tmp_authors);

        # One list entry per line added/removed, so vcs_assign can count them
        my (@list_added, @list_deleted);
        foreach my $author (@tmp_authors) {
            my ($auth_added, $auth_deleted) = (0, 0);
            foreach my $idx (0 .. $#stats) {
                if ($author eq deduplicate_email($authors[$idx]) &&
                    $stats[$idx] =~ /$stat_pattern/) {
                    $auth_added += $1;
                    $auth_deleted += $2;
                }
            }
            push(@list_added, ($author) x $auth_added);
            push(@list_deleted, ($author) x $auth_deleted);
        }
        vcs_assign("added_lines", $added, @list_added);
        vcs_assign("removed_lines", $deleted, @list_deleted);
    }
}
2277
# Credit the people behind the commits that blame reports for a file.
#   $file - path to examine
# Does nothing when no VCS is available.  The command templates are
# expanded by string eval, so the lexicals "$file" and "$commit" must keep
# these exact names.
#
# With $email_git_blame_signatures set, the signers of the blamed commits
# are collected.  With $from_filename and $output_rolestats set, commit
# authors are looked up as well: for hg they are added to the signer list,
# otherwise each author is credited once per blamed line as
# "authored lines".  The signer list is finally credited as "commits"
# (when $from_filename is set) or "modified commits".
sub vcs_file_blame {
    my ($file) = @_;

    my @signers = ();

    $vcs_used = vcs_exists();
    return if (!$vcs_used);

    my @all_commits = vcs_blame($file);
    my @commits = uniq(@all_commits);
    my $total_commits = @commits;
    my $total_lines = @all_commits;

    if ($email_git_blame_signatures) {
        # hg takes every revision in one query ("A -r B -r C");
        # otherwise each commit is queried on its own
        my @queries = vcs_is_hg() ? (join(" -r ", @commits)) : @commits;

        foreach my $commit (@queries) {
            my $cmd = $VCS_cmds{"find_commit_signers_cmd"};
            $cmd =~ s/(\$\w+)/$1/eeg;	#substitute variables in $cmd

            my ($commit_count, $commit_signers_ref, $commit_authors_ref, $stats_ref) =
                vcs_find_signers($cmd, $file);

            push(@signers, @{$commit_signers_ref}) if defined $commit_signers_ref;
        }
    }

    if ($from_filename && $output_rolestats) {
        my @blame_signers;
        if (vcs_is_hg()) {{		# Double brace for last exit
            @commits = uniq(@commits);
            @commits = sort(@commits);
            my $commit = join(" -r ", @commits);

            my $cmd = $VCS_cmds{"find_commit_author_cmd"};
            $cmd =~ s/(\$\w+)/$1/eeg;	#substitute variables in $cmd

            my @lines = $VCS_cmds{"execute_cmd"}->($cmd);

            if (!$email_git_penguin_chiefs) {
                @lines = grep(!/${penguin_chiefs}/i, @lines);
            }

            last if !@lines;

            my @authors = ();
            foreach my $line (@lines) {
                if ($line =~ m/$VCS_cmds{"author_pattern"}/) {
                    my $author = deduplicate_email($1);
                    push(@authors, $author);
                }
            }

            if ($interactive) {
                save_commits_by_author(@lines);
            }
            if ($interactive) {
                save_commits_by_signer(@lines);
            }

            push(@signers, @authors);
        }}
        else {
            foreach my $commit (@commits) {
                my $cmd = $VCS_cmds{"find_commit_author_cmd"};
                $cmd =~ s/(\$\w+)/$1/eeg;	#interpolate $cmd
                my @author = vcs_find_author($cmd);
                next if !@author;

                my $formatted_author = deduplicate_email($author[0]);

                # One entry per blamed line that belongs to this commit
                my $count = grep(/$commit/, @all_commits);
                push(@blame_signers, ($formatted_author) x $count);
            }
        }
        if (@blame_signers) {
            vcs_assign("authored lines", $total_lines, @blame_signers);
        }
    }

    foreach my $signer (@signers) {
        $signer = deduplicate_email($signer);
    }

    my $role = $from_filename ? "commits" : "modified commits";
    vcs_assign($role, $total_commits, @signers);
}
2405
# Ask the VCS whether it knows a file.
#   $file - path to check; referenced by name from the command template,
#           which is expanded by string eval
# Returns 0 when no VCS is available or the command exits non-zero,
# otherwise whatever the command produced (stderr is folded into stdout).
sub vcs_file_exists {
    my ($file) = @_;

    return 0 if (!vcs_exists());

    my $cmd = $VCS_cmds{"file_exists_cmd"};
    $cmd =~ s/(\$\w+)/$1/eeg;		# interpolate $cmd
    $cmd .= " 2>&1";

    my $exists = $VCS_cmds{"execute_cmd"}->($cmd);

    return ($? != 0) ? 0 : $exists;
}
2423
# List the files the VCS tracks for a path.
#   $file - path to list; referenced by name from the command template,
#           which is expanded by string eval
# Returns the lines produced by the list command, or an empty list when no
# VCS is available or the command exits non-zero.
sub vcs_list_files {
    my ($file) = @_;

    my @lsfiles = ();

    my $vcs_used = vcs_exists();
    # Every exit returns a list: a plain "return 0" here would hand a
    # list-context caller the one-element list (0), i.e. a file named "0".
    return () if (!$vcs_used);

    my $cmd = $VCS_cmds{"list_files_cmd"};
    $cmd =~ s/(\$\w+)/$1/eeg;   # interpolate $cmd
    @lsfiles = &{$VCS_cmds{"execute_cmd"}}($cmd);

    return () if ($? != 0);

    return @lsfiles;
}
2440
# Drop repeated values while keeping first-seen order.
#   @parms - values to filter (compared as strings)
# Returns the distinct values in the order of their first occurrence.
sub uniq {
    my (@parms) = @_;

    my %saw;
    my @distinct;
    foreach my $item (@parms) {
        next if ($saw{$item}++);
        push(@distinct, $item);
    }
    return @distinct;
}
2448
# Sort values as strings and drop repeats.
#   @parms - values to process
# Returns the distinct values in ascending string order.
sub sort_and_uniq {
    my (@parms) = @_;

    my @distinct;
    foreach my $item (sort @parms) {
        # After sorting, equal strings sit next to each other
        if (!@distinct || $distinct[-1] ne $item) {
            push(@distinct, $item);
        }
    }
    return @distinct;
}
2457
# Tidy addresses harvested from file contents.
#   @file_emails - raw strings, each containing an email address
# For every entry the address is normalized to <addr> form, the name part
# is reduced to its last two words (three when the first or middle of the
# last three looks like an initial), one leading and one trailing comma or
# period is trimmed, and the result is rebuilt with format_email().
# Returns the formatted addresses in input order.
sub clean_file_emails {
    my (@file_emails) = @_;
    my @fmt_emails = ();

    foreach my $email (@file_emails) {
        $email =~ s/[\(\<\{]{0,1}([A-Za-z0-9_\.\+-]+\@[A-Za-z0-9\.-]+)[\)\>\}]{0,1}/\<$1\>/g;
        my ($name, $address) = parse_email($email);

        # Strip quotes for easier processing, format_email will add them back
        $name =~ s/^"(.*)"$/$1/;

        # Split into name-like parts and remove stray punctuation particles
        my @nw = grep { !/^[\'\,\.\+-]$/ } split(/[^\p{L}\'\,\.\+-]/, $name);

        # Best effort at "the name and only the name": the last two words,
        # or the last three when an obvious initial is among them.
        if (@nw > 2) {
            my ($first, $middle, $last) = @nw[-3 .. -1];

            my $first_is_initial =
                (length($first) == 1 && $first =~ m/\p{L}/) ||
                (length($first) == 2 && substr($first, -1) eq ".");
            my $middle_is_initial =
                length($middle) == 1 ||
                (length($middle) == 2 && substr($middle, -1) eq ".");

            $name = ($first_is_initial || $middle_is_initial)
                ? "$first $middle $last"
                : "$middle $last";
        } else {
            $name = "@nw";
        }

        # Trim one trailing, then one leading, comma or period
        $name =~ s/[,.]\z//;
        $name =~ s/\A[,.]//;

        my $fmt_email = format_email($name, $address, $email_usename);
        push(@fmt_emails, $fmt_email);
    }
    return @fmt_emails;
}
2506
# Collapse [address, role] pairs into output lines.
#   @_ - array references of the form [ $address, $role ]
# Only the first pair for each address is kept.  With $output_roles set the
# line reads "address (role)", otherwise just the address.
# Returns the lines in first-seen order.
sub merge_email {
    my @lines;
    my %saw;

    foreach my $entry (@_) {
        my ($address, $role) = @{$entry};
        next if ($saw{$address});

        $saw{$address} = 1;
        push(@lines, $output_roles ? "$address ($role)" : $address);
    }

    return @lines;
}
2525
# Print the result entries to standard output.
#   @parms - strings to print
# With $output_multiline set each entry goes on its own line; otherwise all
# entries are joined with $output_separator on one newline-terminated line.
sub output {
    my (@parms) = @_;

    if (!$output_multiline) {
        print(join($output_separator, @parms));
        print("\n");
        return;
    }

    foreach my $entry (@parms) {
        print("${entry}\n");
    }
}
2538
# Source text of the RFC 822 address pattern.  Left unset here; the
# rfc822_valid and rfc822_validlist routines fill it in from
# make_rfc822re() the first time either of them runs.
2539my $rfc822re;
2540
# Build the source text of a regular expression matching one RFC 822
# address (a mailbox or a group), with optional leading linear whitespace.
# Takes no arguments and returns the pattern as a plain string, not a
# compiled regex.  The pieces are assembled bottom-up by string
# interpolation, and every group formed in this sub is non-capturing.
# NOTE(review): $rfc822_lwsp is defined outside this sub - presumably the
# linear-white-space pattern; confirm at its definition.
2541sub make_rfc822re {
2542#   Basic lexical tokens are specials, domain_literal, quoted_string, atom, and
2543#   comment.  We must allow for rfc822_lwsp (or comments) after each of these.
2544#   This regexp will only work on addresses which have had comments stripped
2545#   and replaced with rfc822_lwsp.
2546
# Character sets, pre-escaped for use inside a bracketed class in $atom
2547    my $specials = '()<>@,;:\\\\".\\[\\]';
2548    my $controls = '\\000-\\037\\177';
2549
# Bracketed domain literal: any run of $dtext or backslash-escaped chars
2550    my $dtext = "[^\\[\\]\\r\\\\]";
2551    my $domain_literal = "\\[(?:$dtext|\\\\.)*\\]$rfc822_lwsp*";
2552
2553    my $quoted_string = "\"(?:[^\\\"\\r\\\\]|\\\\.|$rfc822_lwsp)*\"$rfc822_lwsp*";
2554
2555#   Use zero-width assertion to spot the limit of an atom.  A simple
2556#   $rfc822_lwsp* causes the regexp engine to hang occasionally.
2557    my $atom = "[^$specials $controls]+(?:$rfc822_lwsp+|\\Z|(?=[\\[\"$specials]))";
2558    my $word = "(?:$atom|$quoted_string)";
# local-part: one or more words joined by dots
2559    my $localpart = "$word(?:\\.$rfc822_lwsp*$word)*";
2560
# domain: one or more sub-domains (atoms or domain literals) joined by dots
2561    my $sub_domain = "(?:$atom|$domain_literal)";
2562    my $domain = "$sub_domain(?:\\.$rfc822_lwsp*$sub_domain)*";
2563
2564    my $addr_spec = "$localpart\@$rfc822_lwsp*$domain";
2565
# mailbox: either a bare addr-spec, or an optional phrase followed by an
# angle-bracketed address that may start with a source route
2566    my $phrase = "$word*";
2567    my $route = "(?:\@$domain(?:,\@$rfc822_lwsp*$domain)*:$rfc822_lwsp*)";
2568    my $route_addr = "\\<$rfc822_lwsp*$route?$addr_spec\\>$rfc822_lwsp*";
2569    my $mailbox = "(?:$addr_spec|$phrase$route_addr)";
2570
# group: phrase, colon, optional comma-separated mailboxes, semicolon
2571    my $group = "$phrase:$rfc822_lwsp*(?:$mailbox(?:,\\s*$mailbox)*)?;\\s*";
2572    my $address = "(?:$mailbox|$group)";
2573
2574    return "$rfc822_lwsp*$address";
2575}
2576
# Remove RFC 822 comments from an address string.
#   first argument - the string to clean
# Parenthesized comments that sit outside double-quoted strings are
# replaced by a single space, one innermost comment per pass, until none is
# left (so nested comments disappear too).  Backslash-escaped characters
# are never treated as quotes or parentheses.
# Returns the cleaned string.
sub rfc822_strip_comments {
    my ($text) = @_;

    # Each successful substitution removes one comment; repeat until none match
    1 while ($text =~ s/^((?:[^"\\]|\\.)*
                    (?:"(?:[^"\\]|\\.)*"(?:[^"\\]|\\.)*)*)
                    \((?:[^()\\]|\\.)*\)/$1 /osx);

    return $text;
}
2588
#   valid: returns true if the parameter is an RFC822 valid address.
#   Comments are stripped first; the address must match the (lazily built)
#   RFC 822 pattern in full and consist only of $rfc822_char characters.
#
sub rfc822_valid {
    my $candidate = rfc822_strip_comments(shift);

    $rfc822re ||= make_rfc822re();

    return $candidate =~ m/^$rfc822re$/so && $candidate =~ m/^$rfc822_char*$/;
}
2600
#   validlist: In scalar context, returns true if the parameter is an RFC822
#              valid list of addresses.
#
#              In list context, returns an empty list on failure (an invalid
#              address was found); otherwise a list whose first element is the
#              number of addresses found and whose remaining elements are the
#              addresses.  The leading count is what tells failure (invalid)
#              apart from success with no addresses found, because an empty
#              string is a valid list.

sub rfc822_validlist {
    my $candidates = rfc822_strip_comments(shift);

    $rfc822re ||= make_rfc822re();

    # * null list items are valid according to the RFC
    my $well_formed =
        ($candidates =~ m/^(?:$rfc822re)?(?:,(?:$rfc822re)?)*$/so &&
         $candidates =~ m/^$rfc822_char*$/);

    if (!$well_formed) {
        return wantarray ? () : 0;
    }

    my @found;
    while ($candidates =~ m/(?:^|,$rfc822_lwsp*)($rfc822re)/gos) {
        push(@found, $1);
    }

    # * the count in front aids in distinguishing failure from no results
    return wantarray ? (scalar(@found), @found) : 1;
}