]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blame - scripts/get_maintainer.pl
get_maintainer: add --no-foo options to --help
[mirror_ubuntu-bionic-kernel.git] / scripts / get_maintainer.pl
CommitLineData
cb7301c7
JP
1#!/usr/bin/perl -w
2# (c) 2007, Joe Perches <joe@perches.com>
3# created from checkpatch.pl
4#
5# Print selected MAINTAINERS information for
6# the files modified in a patch or for a file
7#
3bd7bf5f
RK
8# usage: perl scripts/get_maintainer.pl [OPTIONS] <patch>
9# perl scripts/get_maintainer.pl [OPTIONS] -f <file>
cb7301c7
JP
10#
11# Licensed under the terms of the GNU GPL License version 2
12
13use strict;
14
my $P = $0;
my $V = '0.26';

use Getopt::Long qw(:config no_auto_abbrev);

# Path to the top of the kernel tree; file names below are built from it.
my $lk_path = "./";

# Which kinds of email recipients are reported (see the GetOptions table).
my $email = 1;
my $email_usename = 1;
my $email_maintainer = 1;
my $email_reviewer = 1;
my $email_list = 1;
my $email_subscriber_list = 0;

# Recipient discovery from VCS history.
my $email_git_penguin_chiefs = 0;
my $email_git = 0;
my $email_git_all_signature_types = 0;
my $email_git_blame = 0;
my $email_git_blame_signatures = 1;
my $email_git_fallback = 1;
my $email_git_min_signatures = 1;
my $email_git_max_maintainers = 5;
my $email_git_min_percent = 5;
my $email_git_since = "1-year-ago";
my $email_hg_since = "-365";

my $interactive = 0;
my $email_remove_duplicates = 1;
my $email_use_mailmap = 1;

# Output formatting.
my $output_multiline = 1;
my $output_separator = ", ";
my $output_roles = 0;
my $output_rolestats = 1;
my $output_section_maxlen = 50;

# Which MAINTAINERS fields other than email are printed.
my ($scm, $web, $subsystem, $status) = (0, 0, 0, 0);
my $keywords = 1;
my $sections = 0;
my $file_emails = 0;
my $from_filename = 0;
my $pattern_depth = 0;
my ($version, $help) = (0, 0);

my $vcs_used = 0;

# Process exit status handed to exit() at the end of the main program.
my $exit = 0;

my %commit_author_hash;
my %commit_signer_hash;

# "Name:address" entries for the people at the top of the tree.
my @penguin_chief = (
    "Linus Torvalds:torvalds\@linux-foundation.org",
);
#Andrew wants in on most everything - 2009/01/14
#push(@penguin_chief, "Andrew Morton:akpm\@linux-foundation.org");

# Keep only the name half of every well-formed "Name:address" entry.
my @penguin_chief_names =
    map { m/^(.*):(.*)/ ? ($1) : () } @penguin_chief;
my $penguin_chiefs = "\(" . join("|", @penguin_chief_names) . "\)";

# Signature types of people who are either
#	a) responsible for the code in question, or
#	b) familiar enough with it to give relevant feedback
my @signature_tags = (
    "Signed-off-by:",
    "Reviewed-by:",
    "Acked-by:",
);

my $signature_pattern = "\(" . join("|", @signature_tags) . "\)";

# rfc822 email address - preloaded methods go here.
my $rfc822_lwsp = "(?:(?:\\r\\n)?[ \\t])";
my $rfc822_char = '[\\000-\\377]';
1b5e1cf6 93
60db31ac
JP
# VCS command support: class-like functions and strings
#
# Each table maps an operation name to either a code reference, a command
# template, or a regex source string.  Placeholders such as \$file, \$commit,
# \$diff_start and \$email_git_since are stored literally (the '$' is escaped
# here); they are not expanded in this block.

my %VCS_cmds;

my %VCS_cmds_git = (
    execute_cmd => \&git_execute_cmd,
    available => '(which("git") ne "") && (-e ".git")',
    find_signers_cmd =>
        "git log --no-color --follow --since=\$email_git_since " .
        '--numstat --no-merges ' .
        '--format="GitCommit: %H%n' .
        'GitAuthor: %an <%ae>%n' .
        'GitDate: %aD%n' .
        'GitSubject: %s%n' .
        '%b%n"' .
        " -- \$file",
    find_commit_signers_cmd =>
        "git log --no-color " .
        '--numstat ' .
        '--format="GitCommit: %H%n' .
        'GitAuthor: %an <%ae>%n' .
        'GitDate: %aD%n' .
        'GitSubject: %s%n' .
        '%b%n"' .
        " -1 \$commit",
    find_commit_author_cmd =>
        "git log --no-color " .
        '--numstat ' .
        '--format="GitCommit: %H%n' .
        'GitAuthor: %an <%ae>%n' .
        'GitDate: %aD%n' .
        'GitSubject: %s%n"' .
        " -1 \$commit",
    blame_range_cmd => "git blame -l -L \$diff_start,+\$diff_length \$file",
    blame_file_cmd => "git blame -l \$file",
    commit_pattern => "^GitCommit: ([0-9a-f]{40,40})",
    blame_commit_pattern => "^([0-9a-f]+) ",
    author_pattern => "^GitAuthor: (.*)",
    subject_pattern => "^GitSubject: (.*)",
    stat_pattern => "^(\\d+)\\t(\\d+)\\t\$file\$",
);

my %VCS_cmds_hg = (
    execute_cmd => \&hg_execute_cmd,
    available => '(which("hg") ne "") && (-d ".hg")',
    find_signers_cmd =>
        "hg log --date=\$email_hg_since " .
        "--template='HgCommit: {node}\\n" .
        "HgAuthor: {author}\\n" .
        "HgSubject: {desc}\\n'" .
        " -- \$file",
    find_commit_signers_cmd =>
        "hg log " .
        "--template='HgSubject: {desc}\\n'" .
        " -r \$commit",
    find_commit_author_cmd =>
        "hg log " .
        "--template='HgCommit: {node}\\n" .
        "HgAuthor: {author}\\n" .
        "HgSubject: {desc|firstline}\\n'" .
        " -r \$commit",
    blame_range_cmd => "",		# not supported
    blame_file_cmd => "hg blame -n \$file",
    commit_pattern => "^HgCommit: ([0-9a-f]{40,40})",
    blame_commit_pattern => "^([ 0-9a-f]+):",
    author_pattern => "^HgAuthor: (.*)",
    subject_pattern => "^HgSubject: (.*)",
    stat_pattern => "^(\\d+)\t(\\d+)\t\$file\$",
);
163
bcde44ed
JP
# Read default command-line arguments from .get_maintainer.conf, if present.
# Every whitespace-separated word that is not part of a '#' comment is
# prepended to @ARGV, so real command-line arguments come after (and can
# therefore override) the configured ones.
my $conf = which_conf(".get_maintainer.conf");
if (-f $conf) {
    my @conf_args;

    if (open(my $conffile, '<', "$conf")) {
        while (my $line = <$conffile>) {
            $line =~ s/\s*\n?$//g;
            $line =~ s/^\s*//g;
            $line =~ s/\s+/ /g;

            next if ($line =~ m/^\s*#/);
            next if ($line =~ m/^\s*$/);

            my @words = split(" ", $line);
            foreach my $word (@words) {
                # A word starting with '#' begins a trailing comment.
                last if ($word =~ m/^#/);
                push (@conf_args, $word);
            }
        }
        close($conffile);
    } else {
        # Best effort: report the problem and carry on without the file
        # instead of reading from (and closing) an unopened handle.
        warn "$P: Can't find a readable .get_maintainer.conf file $!\n";
    }

    unshift(@ARGV, @conf_args) if @conf_args;
}
189
435de078
JP
# Addresses listed in .get_maintainer.ignore, one per line.  '#' starts a
# comment; blank lines and lines that do not hold a valid address are skipped.
my @ignore_emails = ();
my $ignore_file = which_conf(".get_maintainer.ignore");
if (-f $ignore_file) {
    if (open(my $ignore, '<', "$ignore_file")) {
        while (my $line = <$ignore>) {
            # Strip the comment first and trim afterwards, so that
            # "addr  # note" is stored as "addr" rather than "addr " --
            # ignore_email_address() compares entries with 'eq'.
            $line =~ s/#.*$//;
            $line =~ s/^\s+|\s+$//g;

            next if ($line =~ m/^\s*$/);
            if (rfc822_valid($line)) {
                push(@ignore_emails, $line);
            }
        }
        close($ignore);
    } else {
        # Best effort: report the problem and carry on without the file
        # instead of reading from (and closing) an unopened handle.
        warn "$P: Can't find a readable .get_maintainer.ignore file $!\n";
    }
}
210
cb7301c7
JP
# Command-line option table: option specification => variable it sets.
# A trailing '!' makes the option negatable (--foo / --nofoo / --no-foo).
my @option_spec = (
    'email!' => \$email,
    'git!' => \$email_git,
    'git-all-signature-types!' => \$email_git_all_signature_types,
    'git-blame!' => \$email_git_blame,
    'git-blame-signatures!' => \$email_git_blame_signatures,
    'git-fallback!' => \$email_git_fallback,
    'git-chief-penguins!' => \$email_git_penguin_chiefs,
    'git-min-signatures=i' => \$email_git_min_signatures,
    'git-max-maintainers=i' => \$email_git_max_maintainers,
    'git-min-percent=i' => \$email_git_min_percent,
    'git-since=s' => \$email_git_since,
    'hg-since=s' => \$email_hg_since,
    'i|interactive!' => \$interactive,
    'remove-duplicates!' => \$email_remove_duplicates,
    'mailmap!' => \$email_use_mailmap,
    'm!' => \$email_maintainer,
    'r!' => \$email_reviewer,
    'n!' => \$email_usename,
    'l!' => \$email_list,
    's!' => \$email_subscriber_list,
    'multiline!' => \$output_multiline,
    'roles!' => \$output_roles,
    'rolestats!' => \$output_rolestats,
    'separator=s' => \$output_separator,
    'subsystem!' => \$subsystem,
    'status!' => \$status,
    'scm!' => \$scm,
    'web!' => \$web,
    'pattern-depth=i' => \$pattern_depth,
    'k|keywords!' => \$keywords,
    'sections!' => \$sections,
    'fe|file-emails!' => \$file_emails,
    'f|file' => \$from_filename,
    'v|version' => \$version,
    'h|help|usage' => \$help,
);

GetOptions(@option_spec)
    or die "$P: invalid argument - use --help if necessary\n";

if ($help != 0) {
    usage();
    exit 0;
}

if ($version != 0) {
    print("${P} ${V}\n");
    exit 0;
}

# We're talking to a terminal, but have no command line arguments.
die "$P: missing patchfile or -f file - use --help if necessary\n"
    if (-t STDIN && !@ARGV);

# Derived settings: a custom separator implies single-line output, and
# interactive mode / rolestats imply the richer role output.
$output_multiline = 0 if ($output_separator ne ", ");
$output_rolestats = 1 if ($interactive);
$output_roles = 1 if ($output_rolestats);

if ($sections) {
    # --sections prints whole MAINTAINERS sections, so every other
    # selection is switched off.
    ($email, $email_list, $scm, $status, $subsystem, $web, $keywords,
     $interactive) = (0) x 8;
} else {
    my $selections = $email + $scm + $status + $subsystem + $web;
    die "$P: Missing required option: email, scm, status, subsystem or web\n"
        if ($selections == 0);
}

if ($email) {
    my $email_sources = $email_maintainer + $email_reviewer +
                        $email_list + $email_subscriber_list +
                        $email_git + $email_git_penguin_chiefs +
                        $email_git_blame;
    die "$P: Please select at least 1 email option\n"
        if ($email_sources == 0);
}

top_of_kernel_tree($lk_path)
    or die "$P: The current directory does not appear to be "
         . "a linux kernel source tree.\n";
297
## Read MAINTAINERS for type/value pairs
#
# @typevalue receives one entry per non-blank MAINTAINERS line: "T:value"
# for tagged lines, the chomped line itself for everything else.
# %keyword_hash maps the @typevalue index of each K: line to its pattern.

my @typevalue = ();
my %keyword_hash;

open (my $maint, '<', "${lk_path}MAINTAINERS")
    or die "$P: Can't open MAINTAINERS: $!\n";
while (my $line = <$maint>) {
    if ($line =~ m/^([A-Z]):\s*(.*)/) {
        my ($type, $value) = ($1, $2);

        if ($type eq "F" || $type eq "X") {
            ##Filename pattern matching: turn the glob into a regex
            $value =~ s@\.@\\\.@g;       ##Convert . to \.
            $value =~ s/\*/\.\*/g;       ##Convert * to .*
            $value =~ s/\?/\./g;         ##Convert ? to .
            ##if pattern is a directory and it lacks a trailing slash, add one
            $value =~ s@([^/])$@$1/@ if ((-d $value));
        } elsif ($type eq "K") {
            # Key is the index the entry pushed just below will occupy.
            $keyword_hash{scalar(@typevalue)} = $value;
        }
        push(@typevalue, "$type:$value");
    } elsif ($line !~ /^(\s)*$/) {
        $line =~ s/\n$//g;
        push(@typevalue, $line);
    }
}
close($maint);
cb7301c7 331
8cbb3a77 332
7fa8ff2e
FM
333#
334# Read mail address map
335#
336
b9e2331d
JP
my $mailmap;

read_mailmap();

# Populate $mailmap from "${lk_path}.mailmap".
#
# $mailmap is reset to { names => {}, addresses => {} } on every call.  When
# $email_use_mailmap is false, or the file is missing or cannot be opened,
# both tables stay empty.  Otherwise:
#   $mailmap->{names}{KEY}     = real name to use for KEY
#   $mailmap->{addresses}{KEY} = real address to use for KEY
# where KEY is the "wrong" address, or the formatted "wrong name <address>"
# for entries that name both sides.
sub read_mailmap {
    $mailmap = {
        names => {},
        addresses => {}
    };

    return if (!$email_use_mailmap || !(-f "${lk_path}.mailmap"));

    my $mailmap_file;
    if (!open($mailmap_file, '<', "${lk_path}.mailmap")) {
        # Warn and give up rather than reading an unopened handle.
        warn "$P: Can't open .mailmap: $!\n";
        return;
    }

    while (my $entry = <$mailmap_file>) {
        $entry =~ s/#.*$//;          #strip comments
        $entry =~ s/^\s+|\s+$//g;    #trim

        next if ($entry =~ /^\s*$/); #skip empty lines
        #entries have one of the following formats:
        # name1 <mail1>
        # <mail1> <mail2>
        # name1 <mail1> <mail2>
        # name1 <mail1> name2 <mail2>
        # (see man git-shortlog)
        #
        # The patterns are tried from most to least specific; the order
        # of the branches matters.

        if ($entry =~ /^([^<]+)<([^>]+)>$/) {
            my $real_name = $1;
            my $address = $2;

            $real_name =~ s/\s+$//;
            ($real_name, $address) = parse_email("$real_name <$address>");
            $mailmap->{names}->{$address} = $real_name;

        } elsif ($entry =~ /^<([^>]+)>\s*<([^>]+)>$/) {
            my $real_address = $1;
            my $wrong_address = $2;

            $mailmap->{addresses}->{$wrong_address} = $real_address;

        } elsif ($entry =~ /^(.+)<([^>]+)>\s*<([^>]+)>$/) {
            my $real_name = $1;
            my $real_address = $2;
            my $wrong_address = $3;

            $real_name =~ s/\s+$//;
            ($real_name, $real_address) =
                parse_email("$real_name <$real_address>");
            $mailmap->{names}->{$wrong_address} = $real_name;
            $mailmap->{addresses}->{$wrong_address} = $real_address;

        } elsif ($entry =~ /^(.+)<([^>]+)>\s*(.+)\s*<([^>]+)>$/) {
            my $real_name = $1;
            my $real_address = $2;
            my $wrong_name = $3;
            my $wrong_address = $4;

            $real_name =~ s/\s+$//;
            ($real_name, $real_address) =
                parse_email("$real_name <$real_address>");

            $wrong_name =~ s/\s+$//;
            ($wrong_name, $wrong_address) =
                parse_email("$wrong_name <$wrong_address>");

            # Both sides are named: key on the full "name <address>" form.
            my $wrong_email = format_email($wrong_name, $wrong_address, 1);
            $mailmap->{names}->{$wrong_email} = $real_name;
            $mailmap->{addresses}->{$wrong_email} = $real_address;
        }
    }
    close($mailmap_file);
}
410
## use the filenames on the command line or find the filenames in the patchfiles
#
# Fills @files (paths to look up), @range ("file:start:length" hunks, only
# collected for --git-blame), @keyword_tvi (indexes of matching K: entries)
# and @file_emails (addresses found inside -f files).

my @files = ();
my @range = ();
my @keyword_tvi = ();
my @file_emails = ();

# No arguments: read a patch from standard input.
push(@ARGV, "&STDIN") if (!@ARGV);

foreach my $file (@ARGV) {
    if ($file ne "&STDIN") {
        if ((-d $file)) {
            ##if $file is a directory and it lacks a trailing slash, add one
            $file =~ s@([^/])$@$1/@;
        } elsif (!(-f $file)) {
            die "$P: file '${file}' not found\n";
        }
    }

    if ($from_filename) {
        # -f: the argument itself is the file of interest.
        push(@files, $file);
        next if ($file eq "MAINTAINERS" || !(-f $file) ||
                 !($keywords || $file_emails));

        open(my $f, '<', $file)
            or die "$P: Can't open $file: $!\n";
        my $text = do { local($/) ; <$f> };
        close($f);

        if ($keywords) {
            foreach my $tvi_key (keys %keyword_hash) {
                push(@keyword_tvi, $tvi_key)
                    if ($text =~ m/$keyword_hash{$tvi_key}/x);
            }
        }
        if ($file_emails) {
            my @poss_addr = $text =~ m$[A-Za-zÀ-ÿ\"\' \,\.\+-]*\s*[\,]*\s*[\(\<\{]{0,1}[A-Za-z0-9_\.\+-]+\@[A-Za-z0-9\.-]+\.[A-Za-z0-9]+[\)\>\}]{0,1}$g;
            push(@file_emails, clean_file_emails(@poss_addr));
        }
        next;
    }

    # Otherwise the argument is a patch: pull the touched file names out of it.
    my $file_cnt = @files;
    my $lastfile;

    # Deliberately the 2-argument form: it is what lets "&STDIN" reopen
    # standard input.
    open(my $patch, "< $file")
        or die "$P: Can't open $file: $!\n";

    # We can check arbitrary information before the patch
    # like the commit message, mail headers, etc...
    # This allows us to match arbitrary keywords against any part
    # of a git format-patch generated file (subject tags, etc...)

    my $patch_prefix = "";                  #Parsing the intro

    while (my $patch_line = <$patch>) {
        if ($patch_line =~ m/^\+\+\+\s+(\S+)/ or
            $patch_line =~ m/^---\s+(\S+)/) {
            my $filename = $1;
            $filename =~ s@^[^/]*/@@;
            $filename =~ s@\n@@;
            $lastfile = $filename;
            push(@files, $filename);
            $patch_prefix = "^[+-].*";      #Now parsing the actual patch
        } elsif ($patch_line =~ m/^\@\@ -(\d+),(\d+)/) {
            push(@range, "$lastfile:$1:$2") if ($email_git_blame);
        } elsif ($keywords) {
            foreach my $tvi_key (keys %keyword_hash) {
                push(@keyword_tvi, $tvi_key)
                    if ($patch_line =~ m/${patch_prefix}$keyword_hash{$tvi_key}/x);
            }
        }
    }
    close($patch);

    if ($file_cnt == @files) {
        warn "$P: file '${file}' doesn't appear to be a patch.  "
            . "Add -f to options?\n";
    }
    @files = sort_and_uniq(@files);
}

@file_emails = uniq(@file_emails);
496
683c6f8f
JP
# Result accumulators; get_maintainers() resets and fills them.
my %email_hash_name;
my %email_hash_address;
my @email_to = ();
my %hash_list_to;
my @list_to = ();
my @scm = ();
my @web = ();
my @subsystem = ();
my @status = ();
my %deduplicate_name_hash = ();
my %deduplicate_address_hash = ();

my @maintainers = get_maintainers();

if (@maintainers) {
    @maintainers = merge_email(@maintainers);
    output(@maintainers);
}

# Print each requested non-email category, de-duplicated, in a fixed order.
foreach my $category ([$scm, \@scm],
                      [$status, \@status],
                      [$subsystem, \@subsystem],
                      [$web, \@web]) {
    my ($wanted, $items) = @{$category};
    next if (!$wanted);

    @{$items} = uniq(@{$items});
    output(@{$items});
}

exit($exit);
537
435de078
JP
# Return 1 when $address is exactly equal (string comparison) to one of the
# entries in @ignore_emails, 0 otherwise.
sub ignore_email_address {
    my ($address) = @_;

    my $listed = grep { $_ eq $address } @ignore_emails;

    return $listed ? 1 : 0;
}
547
ab6c937d
JP
# Return 1 if any "S:" entry in @typevalue[$start .. $end - 1] has a value
# containing "maintain" or "support" (case-insensitive), 0 otherwise.
sub range_is_maintained {
    my ($start, $end) = @_;

    foreach my $idx ($start .. $end - 1) {
        my $entry = $typevalue[$idx];
        next if ($entry !~ m/^([A-Z]):\s*(.*)/);

        my ($type, $value) = ($1, $2);
        return 1 if ($type eq 'S' && $value =~ /(maintain|support)/i);
    }

    return 0;
}
565
# Return 1 if @typevalue[$start .. $end - 1] contains at least one "M:"
# entry, 0 otherwise.
sub range_has_maintainer {
    my ($start, $end) = @_;

    foreach my $idx ($start .. $end - 1) {
        my $entry = $typevalue[$idx];
        next if ($entry !~ m/^([A-Z]):\s*(.*)/);

        my $type = $1;
        return 1 if ($type eq 'M');
    }

    return 0;
}
581
# Work out who should be contacted for every entry in @files.
#
# Resets the file-level result accumulators, then:
#   1. matches each file against the F:/X:/N: patterns of every MAINTAINERS
#      section held in @typevalue and calls add_categories() for each
#      matching section, deepest pattern first (printing the section
#      itself when --sections is active);
#   2. calls add_categories() for the keyword matches in @keyword_tvi;
#   3. consults VCS history (signoffs and/or blame) when requested, or as a
#      fallback when no maintained section matched the file exactly;
#   4. adds or removes the chief penguins and adds addresses found in files.
#
# Returns the list of [address, role] pairs built from @email_to and
# @list_to (passed through the interactive menu when --interactive is set).
sub get_maintainers {
    %email_hash_name = ();
    %email_hash_address = ();
    %commit_author_hash = ();
    %commit_signer_hash = ();
    @email_to = ();
    %hash_list_to = ();
    @list_to = ();
    @scm = ();
    @web = ();
    @subsystem = ();
    @status = ();
    %deduplicate_name_hash = ();
    %deduplicate_address_hash = ();
    if ($email_git_all_signature_types) {
        $signature_pattern = "(.+?)[Bb][Yy]:";
    } else {
        $signature_pattern = "\(" . join("|", @signature_tags) . "\)";
    }

    # Find responsible parties

    my %exact_pattern_match_hash = ();

    foreach my $file (@files) {

        # Section index => pattern depth, for every section matching $file.
        my %hash;
        my $tvi = find_first_section();
        while ($tvi < @typevalue) {
            my $start = find_starting_index($tvi);
            my $end = find_ending_index($tvi);
            my $exclude = 0;
            my $i;

            #Do not match excluded file patterns

            for ($i = $start; $i < $end; $i++) {
                my $line = $typevalue[$i];
                if ($line =~ m/^([A-Z]):\s*(.*)/) {
                    my $type = $1;
                    my $value = $2;
                    if ($type eq 'X') {
                        if (file_match_pattern($file, $value)) {
                            $exclude = 1;
                            last;
                        }
                    }
                }
            }

            if (!$exclude) {
                for ($i = $start; $i < $end; $i++) {
                    my $line = $typevalue[$i];
                    if ($line =~ m/^([A-Z]):\s*(.*)/) {
                        my $type = $1;
                        my $value = $2;
                        if ($type eq 'F') {
                            if (file_match_pattern($file, $value)) {
                                # Depth = number of '/' separated levels.
                                my $value_pd = ($value =~ tr@/@@);
                                my $file_pd = ($file  =~ tr@/@@);
                                $value_pd++ if (substr($value,-1,1) ne "/");
                                $value_pd = -1 if ($value =~ /^\.\*/);
                                if ($value_pd >= $file_pd &&
                                    range_is_maintained($start, $end) &&
                                    range_has_maintainer($start, $end)) {
                                    $exact_pattern_match_hash{$file} = 1;
                                }
                                if ($pattern_depth == 0 ||
                                    (($file_pd - $value_pd) < $pattern_depth)) {
                                    $hash{$tvi} = $value_pd;
                                }
                            }
                        } elsif ($type eq 'N') {
                            # N: values are regular expressions by design.
                            if ($file =~ m/$value/x) {
                                $hash{$tvi} = 0;
                            }
                        }
                    }
                }
            }
            $tvi = $end + 1;
        }

        # Deepest (most specific) pattern matches first.
        foreach my $section_tvi (sort {$hash{$b} <=> $hash{$a}} keys %hash) {
            add_categories($section_tvi);
            if ($sections) {
                my $i;
                my $start = find_starting_index($section_tvi);
                my $end = find_ending_index($section_tvi);
                for ($i = $start; $i < $end; $i++) {
                    my $line = $typevalue[$i];
                    if ($line =~ /^[FX]:/) {		##Restore file patterns
                        $line =~ s/([^\\])\.([^\*])/$1\?$2/g;
                        $line =~ s/([^\\])\.$/$1\?/g;	##Convert . back to ?
                        $line =~ s/\\\./\./g;       	##Convert \. to .
                        $line =~ s/\.\*/\*/g;       	##Convert .* to *
                    }
                    $line =~ s/^([A-Z]):/$1:\t/g;
                    print("$line\n");
                }
                print("\n");
            }
        }
    }

    if ($keywords) {
        @keyword_tvi = sort_and_uniq(@keyword_tvi);
        foreach my $keyword_index (@keyword_tvi) {
            add_categories($keyword_index);
        }
    }

    foreach my $recipient (@email_to, @list_to) {
        $recipient->[0] = deduplicate_email($recipient->[0]);
    }

    foreach my $file (@files) {
        if ($email &&
            ($email_git || ($email_git_fallback &&
                            !$exact_pattern_match_hash{$file}))) {
            vcs_file_signoffs($file);
        }
        if ($email && $email_git_blame) {
            vcs_file_blame($file);
        }
    }

    if ($email) {
        foreach my $chief (@penguin_chief) {
            if ($chief =~ m/^(.*):(.*)/) {
                my ($chief_name, $chief_addr) = ($1, $2);
                my $email_address =
                    format_email($chief_name, $chief_addr, $email_usename);

                if ($email_git_penguin_chiefs) {
                    push(@email_to, [$email_address, 'chief penguin']);
                } else {
                    # \Q...\E: the address is literal text, not a pattern;
                    # without it '.', '(' or '+' would act as regex
                    # metacharacters.
                    @email_to = grep($_->[0] !~ /\Q${email_address}\E/,
                                     @email_to);
                }
            }
        }

        foreach my $file_email (@file_emails) {
            my ($name, $address) = parse_email($file_email);

            my $tmp_email = format_email($name, $address, $email_usename);
            push_email_address($tmp_email, '');
            add_role($tmp_email, 'in file');
        }
    }

    my @to = ();
    if ($email || $email_list) {
        if ($email) {
            @to = (@to, @email_to);
        }
        if ($email_list) {
            @to = (@to, @list_to);
        }
    }

    if ($interactive) {
        @to = interactive_get_maintainers(\@to);
    }

    return @to;
}
748
cb7301c7
JP
# Return 1 if $file is covered by $pattern, 0 otherwise.
#
# $pattern is used as a regular expression anchored at the start of $file.
# A pattern ending in "/" covers everything below that directory; any other
# pattern only covers files with the same number of "/" as the pattern.
sub file_match_pattern {
    my ($file, $pattern) = @_;

    return 0 if ($file !~ m@^$pattern@);
    return 1 if (substr($pattern, -1) eq "/");

    my $file_slashes = ($file =~ tr@/@@);
    my $pattern_slashes = ($pattern =~ tr@/@@);

    return ($file_slashes == $pattern_slashes) ? 1 : 0;
}
766
# Print the help text to standard output.  The text interpolates the current
# values of the option variables, so the reported defaults reflect whatever
# has been set by the time usage() is called.
sub usage {
    print(<<"EOT");
usage: $P [options] patchfile
 $P [options] -f file|directory
version: $V

MAINTAINER field selection options:
 --email => print email address(es) if any
 --git => include recent git \*-by: signers
 --git-all-signature-types => include signers regardless of signature type
 or use only ${signature_pattern} signers (default: $email_git_all_signature_types)
 --git-fallback => use git when no exact MAINTAINERS pattern (default: $email_git_fallback)
 --git-chief-penguins => include ${penguin_chiefs}
 --git-min-signatures => number of signatures required (default: $email_git_min_signatures)
 --git-max-maintainers => maximum maintainers to add (default: $email_git_max_maintainers)
 --git-min-percent => minimum percentage of commits required (default: $email_git_min_percent)
 --git-blame => use git blame to find modified commits for patch or file
 --git-blame-signatures => when used with --git-blame, also include all commit signers
 --git-since => git history to use (default: $email_git_since)
 --hg-since => hg history to use (default: $email_hg_since)
 --interactive => display a menu (mostly useful if used with the --git option)
 --m => include maintainer(s) if any
 --r => include reviewer(s) if any
 --n => include name 'Full Name <addr\@domain.tld>'
 --l => include list(s) if any
 --s => include subscriber only list(s) if any
 --remove-duplicates => minimize duplicate email names/addresses
 --roles => show roles (status:subsystem, git-signer, list, etc...)
 --rolestats => show roles and statistics (commits/total_commits, %)
 --file-emails => add email addresses found in -f file (default: 0 (off))
 --scm => print SCM tree(s) if any
 --status => print status if any
 --subsystem => print subsystem name if any
 --web => print website(s) if any

Output type options:
 --separator [, ] => separator for multiple entries on 1 line
 using --separator also sets --nomultiline if --separator is not [, ]
 --multiline => print 1 entry per line

Other options:
 --pattern-depth => Number of pattern directory traversals (default: 0 (all))
 --keywords => scan patch for keywords (default: $keywords)
 --sections => print all of the subsystem sections with pattern matches
 --mailmap => use .mailmap file (default: $email_use_mailmap)
 --version => show version
 --help => show this help information

Default options:
 [--email --nogit --git-fallback --m --n --l --multiline --pattern-depth=0
 --remove-duplicates --rolestats]

Notes:
 Using "-f directory" may give unexpected results:
 Used with "--git", git signators for _all_ files in and below
 directory are examined as git recurses directories.
 Any specified X: (exclude) pattern matches are _not_ ignored.
 Used with "--nogit", directory is used as a pattern match,
 no individual file within the directory or subdirectory
 is matched.
 Used with "--git-blame", does not iterate all files in directory
 Using "--git-blame" is slow and may add old committers and authors
 that are no longer active maintainers to the output.
 Using "--roles" or "--rolestats" with git send-email --cc-cmd or any
 other automated tools that expect only ["name"] <email address>
 may not work because of additional output after <email address>.
 Using "--rolestats" and "--git-blame" shows the #/total=% commits,
 not the percentage of the entire file authored. # of commits is
 not a good measure of amount of code authored. 1 major commit may
 contain a thousand lines, 5 trivial commits may modify a single line.
 If git is not installed, but mercurial (hg) is installed and an .hg
 repository exists, the following options apply to mercurial:
 --git,
 --git-min-signatures, --git-max-maintainers, --git-min-percent, and
 --git-blame
 Use --hg-since not --git-since to control date selection
 File ".get_maintainer.conf", if it exists in the linux kernel source root
 directory, can change whatever get_maintainer defaults are desired.
 Entries in this file can be any command line argument.
 This file is prepended to any additional command line arguments.
 Multiple lines and # comments are allowed.
 Most options have both positive and negative forms.
 The negative forms for --<foo> are --no<foo> and --no-<foo>.

EOT
}
853
# Return 1 if $lk_path looks like the top of a Linux kernel source tree,
# i.e. it contains every file and directory listed below; 0 otherwise.
# A trailing "/" is appended to a non-empty path that lacks one.
sub top_of_kernel_tree {
    my ($lk_path) = @_;

    $lk_path .= "/"
        if ($lk_path ne "" && substr($lk_path,length($lk_path)-1,1) ne "/");

    my @required_files = qw(COPYING CREDITS Kbuild MAINTAINERS Makefile README);
    my @required_dirs = qw(Documentation arch include drivers fs init ipc
                           kernel lib scripts);

    foreach my $name (@required_files) {
        return 0 if (!(-f "${lk_path}${name}"));
    }
    foreach my $name (@required_dirs) {
        return 0 if (!(-d "${lk_path}${name}"));
    }

    return 1;
}
880
0e70e83d
JP
# Split a formatted email into (name, address).
#
# Accepts 'Name <addr>', '<addr>' or a bare 'addr'; anything without an "@"
# yields two empty strings.  Surrounding whitespace is trimmed, one pair of
# enclosing double quotes is removed from the name, and a name containing
# characters other than word characters, space and "-" is re-quoted with
# embedded quotes escaped.
sub parse_email {
    my ($formatted_email) = @_;

    my ($name, $address) = ("", "");

    if ($formatted_email =~ /^([^<]+)<(.+\@.*)>.*$/) {
        ($name, $address) = ($1, $2);
    } elsif ($formatted_email =~ /^\s*<(.+\@\S*)>.*$/) {
        $address = $1;
    } elsif ($formatted_email =~ /^(.+\@\S*).*$/) {
        $address = $1;
    }

    foreach my $part ($name, $address) {
        $part =~ s/^\s+|\s+$//g;
    }
    $name =~ s/^\"|\"$//g;

    my $needs_quoting = ($name =~ /[^\w \-]/i);	##has "must quote" chars
    if ($needs_quoting) {
        $name =~ s/(?<!\\)"/\\"/g;		##escape quotes
        $name = "\"$name\"";
    }

    return ($name, $address);
}
907
# Build the printable form of an email.
#
# Returns "name <address>" when $usename is true and the name is non-empty,
# otherwise just the address.  Whitespace is trimmed from both parts, one
# pair of enclosing double quotes is removed from the name, and a name
# containing characters other than word characters, space and "-" is
# wrapped in double quotes with embedded quotes escaped.
sub format_email {
    my ($name, $address, $usename) = @_;

    foreach my $part ($name, $address) {
        $part =~ s/^\s+|\s+$//g;
    }
    $name =~ s/^\"|\"$//g;

    my $needs_quoting = ($name =~ /[^\w \-]/i);	##has "must quote" chars
    if ($needs_quoting) {
        $name =~ s/(?<!\\)"/\\"/g;		##escape quotes
        $name = "\"$name\"";
    }

    my $formatted_email = $address;
    if ($usename && "$name" ne "") {
        $formatted_email = "$name <$address>";
    }

    return $formatted_email;
}
934
272a8979
JP
# Return the index of the first @typevalue entry of the form "X:..." (a
# single capital letter followed by a colon), or the number of entries in
# @typevalue when there is none.
sub find_first_section {
    foreach my $pos (0 .. $#typevalue) {
        return $pos if ($typevalue[$pos] =~ m/^([A-Z]):\s*(.*)/);
    }

    return scalar(@typevalue);
}
948
# Walk backwards from $index while the entries are "X:..." lines and return
# the index of the first entry that is not one (never going below 0).
sub find_starting_index {
    my ($index) = @_;

    $index--
        while ($index > 0 && $typevalue[$index] =~ m/^([A-Z]):\s*(.*)/);

    return $index;
}
962
# Walk forwards from $index while the entries are "X:..." lines and return
# the index of the first entry that is not one, or the number of entries in
# @typevalue when the run reaches the end.
sub find_ending_index {
    my ($index) = @_;

    $index++
        while ($index < @typevalue && $typevalue[$index] =~ m/^([A-Z]):\s*(.*)/);

    return $index;
}
976
3c7385b8
JP
# Return "role:section" for the section that contains @typevalue[$index].
#
# The section name is the entry at the section's starting index, shortened
# to $output_section_maxlen characters (ending in "...") when that limit is
# non-zero and exceeded.  The role comes from the last "S:" entry of the
# section, lower-cased and mapped to a noun; it is "unknown" when the
# section has no "S:" entry.
sub get_maintainer_role {
    my ($index) = @_;

    my $start = find_starting_index($index);
    my $end = find_ending_index($index);

    my $section_name = $typevalue[$start];
    if ($output_section_maxlen && length($section_name) > $output_section_maxlen) {
        $section_name = substr($section_name, 0, $output_section_maxlen - 3);
        $section_name =~ s/\s*$//;
        $section_name = $section_name . "...";
    }

    my $role = "unknown";
    foreach my $pos ($start + 1 .. $end - 1) {
        my $tv = $typevalue[$pos];
        next if ($tv !~ m/^([A-Z]):\s*(.*)/);

        my ($ptype, $pvalue) = ($1, $2);
        $role = $pvalue if ($ptype eq "S");
    }

    # Status word => the word used for a person holding that status.
    my %role_for_status = (
        "supported" => "supporter",
        "maintained" => "maintainer",
        "odd fixes" => "odd fixer",
        "orphan" => "orphan minder",
        "obsolete" => "obsolete minder",
        "buried alive in reporters" => "chief penguin",
    );

    $role = lc($role);
    $role = $role_for_status{$role} if (exists $role_for_status{$role});

    return $role . ":" . $section_name;
}
1020
# Return the section text used to qualify a mailing-list entry at $index.
#
# The text is the @typevalue element at the index returned by
# find_starting_index(), shortened to $output_section_maxlen characters
# (ending in "...") when that limit is non-zero.  The catch-all section
# "THE REST" yields an empty string.
sub get_list_role {
    my ($index) = @_;

    my $section = $typevalue[find_starting_index($index)];

    if ($output_section_maxlen && length($section) > $output_section_maxlen) {
        $section = substr($section, 0, $output_section_maxlen - 3);
        $section =~ s/\s*$//;
        $section .= "...";
    }

    return ($section eq "THE REST") ? "" : $section;
}
1041
b781655a
JP
# Record everything the block around $index contributes.
#
# The element at the block's starting index is pushed onto @subsystem;
# then each "X: value" entry up to the block's end is dispatched by tag:
#   L  mailing list  -> @list_to (once per address, honouring
#                       $email_list / $email_subscriber_list)
#   M  maintainer    -> push_email_addresses() with the maintainer role
#   R  reviewer      -> push_email_addresses() with role 'reviewer'
#   T  -> @scm,  W -> @web,  S -> @status
sub add_categories {
    my ($index) = @_;

    my $start = find_starting_index($index);
    my $end = find_ending_index($index);

    push(@subsystem, $typevalue[$start]);

    # An M:/R: value without a name takes its name from a directly
    # preceding "P:" entry, when there is one.
    my $with_legacy_name = sub {
        my ($pos, $value) = @_;

        my ($name, $address) = parse_email($value);
        return $value if ($name ne "" || $pos <= 0);

        if ($typevalue[$pos - 1] =~ m/^([A-Z]):\s*(.*)/ && $1 eq "P") {
            return format_email($2, $address, $email_usename);
        }
        return $value;
    };

    for my $i ($start + 1 .. $end - 1) {
        next unless ($typevalue[$i] =~ m/^([A-Z]):\s*(.*)/);
        my ($ptype, $pvalue) = ($1, $2);

        if ($ptype eq "L") {
            my $list_address = $pvalue;
            my $list_additional = "";
            my $list_role = get_list_role($i);

            $list_role = ":" . $list_role if ($list_role ne "");

            if ($list_address =~ m/([^\s]+)\s+(.*)$/) {
                ($list_address, $list_additional) = ($1, $2);
            }

            my $kind;
            if ($list_additional =~ m/subscribers-only/) {
                next if (!$email_subscriber_list);
                $kind = "subscriber list";
            } else {
                next if (!$email_list);
                $kind = ($list_additional =~ m/moderated/)
                    ? "moderated list"
                    : "open list";
            }

            if (!$hash_list_to{lc($list_address)}) {
                $hash_list_to{lc($list_address)} = 1;
                push(@list_to, [$list_address, $kind . $list_role]);
            }
        } elsif ($ptype eq "M") {
            $pvalue = $with_legacy_name->($i, $pvalue);
            if ($email_maintainer) {
                my $role = get_maintainer_role($i);
                push_email_addresses($pvalue, $role);
            }
        } elsif ($ptype eq "R") {
            $pvalue = $with_legacy_name->($i, $pvalue);
            if ($email_reviewer) {
                push_email_addresses($pvalue, 'reviewer');
            }
        } elsif ($ptype eq "T") {
            push(@scm, $pvalue);
        } elsif ($ptype eq "W") {
            push(@web, $pvalue);
        } elsif ($ptype eq "S") {
            push(@status, $pvalue);
        }
    }
}
1133
11ecf53c
JP
# Return 1 when ($name, $address) should be treated as already recorded:
# both parts are empty, or the lower-cased name or address is a key of
# %email_hash_name / %email_hash_address.  Return 0 otherwise.
sub email_inuse {
    my ($name, $address) = @_;

    my $have_name = ($name ne "");
    my $have_address = ($address ne "");

    return 1 if (!$have_name && !$have_address);
    return 1 if ($have_name && exists($email_hash_name{lc($name)}));
    return 1 if ($have_address && exists($email_hash_address{lc($address)}));

    return 0;
}
1143
# Append one address, given as the text $line, to @email_to with $role.
#
# Returns 0 when no address could be parsed out of $line, 1 otherwise.
# With $email_remove_duplicates set, an entry whose name or address was
# seen before is not appended again, and every appended entry is recorded
# in %email_hash_name / %email_hash_address.
sub push_email_address {
    my ($line, $role) = @_;

    my ($name, $address) = parse_email($line);
    return 0 if ($address eq "");

    my $already_listed =
        $email_remove_duplicates && email_inuse($name, $address);

    if (!$already_listed) {
        push(@email_to, [format_email($name, $address, $email_usename), $role]);
        if ($email_remove_duplicates) {
            $email_hash_name{lc($name)}++ if ($name ne "");
            $email_hash_address{lc($address)}++;
        }
    }

    return 1;
}
1163
# Add the address or address list in $address to @email_to with $role.
#
# A value accepted by rfc822_valid() is pushed as is; a value accepted by
# rfc822_validlist() is pushed entry by entry; anything else is still
# handed to push_email_address() and a warning is issued when that fails.
sub push_email_addresses {
    my ($address, $role) = @_;

    my @parsed = ();

    if (rfc822_valid($address)) {
        push_email_address($address, $role);
    } elsif (@parsed = rfc822_validlist($address)) {
        shift(@parsed);         # the first element is discarded
        while (@parsed) {
            my $entry = shift(@parsed);
            last if (!$entry);
            push_email_address($entry, $role);
        }
    } else {
        my $pushed = push_email_address($address, $role);
        if (!$pushed) {
            warn("Invalid MAINTAINERS address: '" . $address . "'\n");
        }
    }
}
1182
3c7385b8
JP
# Append $role to the role text of every @email_to entry that denotes the
# person given by $line.
#
# With $email_remove_duplicates set, an entry matches when its address is
# equal or when both names are equal and non-empty; otherwise the whole
# formatted email must be equal.  A role that already occurs in the
# entry's role text is not appended again; roles are joined with ",".
sub add_role {
    my ($line, $role) = @_;

    my ($name, $address) = parse_email($line);
    my $email = format_email($name, $address, $email_usename);

    foreach my $entry (@email_to) {
        my $same_person;
        if ($email_remove_duplicates) {
            my ($entry_name, $entry_address) = parse_email($entry->[0]);
            # Two empty names say nothing about identity; without the
            # non-empty test every nameless entry would match every
            # nameless signer.
            $same_person = (($name ne "" && $name eq $entry_name)
                            || $address eq $entry_address);
        } else {
            $same_person = ($email eq $entry->[0]);
        }
        next if (!$same_person);

        # \Q...\E: the role is plain text, not a pattern
        next if ($role ne "" && $entry->[1] =~ m/\Q$role\E/);

        if ($entry->[1] eq "") {
            $entry->[1] = "$role";
        } else {
            $entry->[1] = "$entry->[1],$role";
        }
    }
}
1214
cb7301c7
JP
# Look for $bin in the directories listed in $ENV{PATH} (colon separated)
# and return "dir/bin" for the first directory where that path exists,
# or "" when there is none.
sub which {
    my ($bin) = @_;

    for my $dir (split(/:/, $ENV{PATH})) {
        my $candidate = "$dir/$bin";
        return $candidate if (-e $candidate);
    }

    return "";
}
1226
bcde44ed
JP
# Look for the file $conf in ".", $ENV{HOME} and ".scripts", in that
# order, and return "dir/conf" for the first place where it exists, or
# "" when it is found nowhere.
sub which_conf {
    my ($conf) = @_;

    for my $dir (split(/:/, ".:$ENV{HOME}:.scripts")) {
        my $candidate = "$dir/$conf";
        return $candidate if (-e $candidate);
    }

    return "";
}
1238
# Map one email through the $mailmap tables and return it formatted as
# a name plus address.
#
# The lookup key is the full formatted email when either table has an
# entry for it, otherwise the bare address.  The name and the address are
# replaced independently, each only when its table has the key.
sub mailmap_email {
    my ($line) = @_;

    my ($name, $address) = parse_email($line);
    my $email = format_email($name, $address, 1);

    my $full_match = (exists $mailmap->{names}->{$email} ||
                      exists $mailmap->{addresses}->{$email});
    my $key = $full_match ? $email : $address;

    my $real_name = exists $mailmap->{names}->{$key}
        ? $mailmap->{names}->{$key}
        : $name;
    my $real_address = exists $mailmap->{addresses}->{$key}
        ? $mailmap->{addresses}->{$key}
        : $address;

    return format_email($real_name, $real_address, 1);
}
1265
# Run every address through mailmap_email() and return the mapped list.
# merge_by_realname() is additionally invoked on the mapped list when
# $email_use_mailmap is set.
sub mailmap {
    my (@addresses) = @_;

    my @mapped_emails = ();
    for my $line (@addresses) {
        my @mapped = mailmap_email($line);
        push(@mapped_emails, @mapped);
    }

    if ($email_use_mailmap) {
        merge_by_realname(@mapped_emails);
    }

    return @mapped_emails;
}
1276
# Give every email that carries the same (non-empty) real name the
# address of the first email seen with that name.
#
# The arguments are rewritten IN PLACE: the elements of @_ alias the
# caller's variables, so calling this on an array in void context updates
# that array.  (Rewriting a private copy of @_ would leave the caller's
# list untouched.)  The resulting list is also returned.
#
# Emails without a name are left alone; keying them on the empty name
# would collapse all of them onto a single address.
sub merge_by_realname {
    my %address_map;

    foreach my $email (@_) {
        my ($name, $address) = parse_email($email);
        next if ($name eq "");

        if (exists $address_map{$name}) {
            $email = format_email($name, $address_map{$name}, 1);
        } else {
            $address_map{$name} = $address;
        }
    }

    return @_;
}
1291
60db31ac
JP
# Run $cmd through the shell and return its output as a list of lines,
# with the leading whitespace of every line removed.
sub git_execute_cmd {
    my ($cmd) = @_;

    (my $trimmed = `$cmd`) =~ s/^\s*//gm;
    my @lines = split("\n", $trimmed);

    return @lines;
}
1302
# Run $cmd through the shell and return its output split into lines.
# The lines are returned unmodified (leading whitespace is kept).
sub hg_execute_cmd {
    my ($cmd) = @_;

    my $raw = `$cmd`;
    my @lines = split("\n", $raw);

    return @lines;
}
1312
683c6f8f
JP
# Split "Tag: person" lines into their two halves.
#
# Returns two array references: the tag part of every line, and the
# person part of every line after it has been passed through
# deduplicate_email().
sub extract_formatted_signatures {
    my (@signature_lines) = @_;

    my @types = ();
    my @signers = ();

    foreach my $line (@signature_lines) {
        (my $type = $line) =~ s/\s*(.*):.*/$1/;

        # cut -f2- -d":"
        (my $person = $line) =~ s/\s*.*:\s*(.+)\s*/$1/;

        ## Reformat email addresses (with names) to avoid badly written signatures
        $person = deduplicate_email($person);

        push(@types, $type);
        push(@signers, $person);
    }

    return (\@types, \@signers);
}
1331
# Run the VCS log command $cmd and pick signatures, authors and stat
# lines out of its output.
#
# Returns (commit count, \@signers, \@authors, \@stats).  When the output
# has no signature line at all, the count is 0 and the signature and
# author lists are the raw matching lines.
#
# The scalar names $cmd, $file, $commits, $pattern and $author_pattern
# are kept as they are: the stat pattern is expanded with s///ee, which
# resolves "$name" against the lexicals in scope here.
sub vcs_find_signers {
    my ($cmd, $file) = @_;
    my $commits;

    my @lines = $VCS_cmds{"execute_cmd"}->($cmd);

    my $pattern = $VCS_cmds{"commit_pattern"};
    my $author_pattern = $VCS_cmds{"author_pattern"};
    my $stat_pattern = $VCS_cmds{"stat_pattern"};

    $stat_pattern =~ s/(\$\w+)/$1/eeg;		#interpolate $stat_pattern

    $commits = grep(/$pattern/, @lines);	# of commits

    my @authors = grep(/$author_pattern/, @lines);
    my @signatures = grep(/^[ \t]*${signature_pattern}.*\@.*$/, @lines);
    my @stats = grep(/$stat_pattern/, @lines);

    return (0, \@signatures, \@authors, \@stats) if !@signatures;

    if ($interactive) {
        save_commits_by_author(@lines);
        save_commits_by_signer(@lines);
    }

    @signatures = grep(!/${penguin_chiefs}/i, @signatures)
        if (!$email_git_penguin_chiefs);

    # only the second (person) list of each result is needed
    my (undef, $authors_ref) = extract_formatted_signatures(@authors);
    my (undef, $signers_ref) = extract_formatted_signatures(@signatures);

    return ($commits, $signers_ref, $authors_ref, \@stats);
}
1370
63ab52db
JP
# Run the VCS command $cmd and return the formatted author of every
# output line that matches the VCS author pattern.  Lines matching
# $penguin_chiefs are dropped first unless $email_git_penguin_chiefs is
# set.  An empty list is returned when no line is left.
sub vcs_find_author {
    my ($cmd) = @_;

    my @lines = $VCS_cmds{"execute_cmd"}->($cmd);

    @lines = grep(!/${penguin_chiefs}/i, @lines)
        if (!$email_git_penguin_chiefs);

    return @lines if !@lines;

    my @authors = ();
    foreach my $line (@lines) {
        next unless ($line =~ m/$VCS_cmds{"author_pattern"}/);
        my $author = $1;
        my ($name, $address) = parse_email($author);
        push(@authors, format_email($name, $address, 1));
    }

    if ($interactive) {
        save_commits_by_author(@lines);
        save_commits_by_signer(@lines);
    }

    return @authors;
}
1398
60db31ac
JP
# Run the blame command $cmd and return, in output order, the first
# capture of the VCS blame-commit pattern for every line that matches it.
sub vcs_save_commits {
    my ($cmd) = @_;

    my @commits = ();

    for my $line ($VCS_cmds{"execute_cmd"}->($cmd)) {
        next unless ($line =~ m/$VCS_cmds{"blame_commit_pattern"}/);
        push(@commits, $1);
    }

    return @commits;
}
1414
# Return the commit ids blamed for $file, one per blamed line.
#
# Without @range entries the whole file is blamed.  With @range entries
# ("file:start:length") only the ranges belonging to $file are used:
# through the VCS's range blame command when it has one, otherwise by
# blaming the whole file and slicing the result.  A leading "^" is
# removed from every id.  An empty list is returned when $file is not a
# regular file.
#
# $file, $diff_start and $diff_length must keep these names: the command
# templates are expanded with s///ee, which resolves "$name" against the
# lexicals in scope.
sub vcs_blame {
    my ($file) = @_;
    my $cmd;
    my @commits = ();

    return @commits if (!(-f $file));

    if (@range && $VCS_cmds{"blame_range_cmd"} eq "") {
        $cmd = $VCS_cmds{"blame_file_cmd"};
        $cmd =~ s/(\$\w+)/$1/eeg;		#interpolate $cmd
        my @all_commits = vcs_save_commits($cmd);

        foreach my $file_range_diff (@range) {
            next if (!($file_range_diff =~ m/(.+):(.+):(.+)/));
            my $diff_file = $1;
            my $diff_start = $2;
            my $diff_length = $3;
            next if ("$file" ne "$diff_file");

            # The range counts file lines from 1 (the range command
            # template is handed the same numbers); @all_commits is
            # assumed to hold one id per file line, so line N sits at
            # index N - 1.  The slice is clamped so that a range reaching
            # past the blame output cannot add undefined entries.
            my $first = $diff_start - 1;
            my $last = $diff_start + $diff_length - 2;
            $first = 0 if ($first < 0);
            $last = $#all_commits if ($last > $#all_commits);
            push(@commits, @all_commits[$first .. $last]) if ($first <= $last);
        }
    } elsif (@range) {
        foreach my $file_range_diff (@range) {
            next if (!($file_range_diff =~ m/(.+):(.+):(.+)/));
            my $diff_file = $1;
            my $diff_start = $2;
            my $diff_length = $3;
            next if ("$file" ne "$diff_file");
            $cmd = $VCS_cmds{"blame_range_cmd"};
            $cmd =~ s/(\$\w+)/$1/eeg;		#interpolate $cmd
            push(@commits, vcs_save_commits($cmd));
        }
    } else {
        $cmd = $VCS_cmds{"blame_file_cmd"};
        $cmd =~ s/(\$\w+)/$1/eeg;		#interpolate $cmd
        @commits = vcs_save_commits($cmd);
    }

    foreach my $commit (@commits) {
        $commit =~ s/^\^//g;
    }

    return @commits;
}
1462
# Set once the "no VCS" hint has been printed, so it appears only once.
my $printed_novcs = 0;

# Select the command table of the first usable VCS into %VCS_cmds.
#
# Returns 1 when the git table's "available" test evaluates true, 2 when
# the hg table's does, and 0 when neither does.  In the last case
# %VCS_cmds is emptied and a hint is printed the first time.
sub vcs_exists {
    my @candidates = ([1, \%VCS_cmds_git], [2, \%VCS_cmds_hg]);

    foreach my $candidate (@candidates) {
        my ($id, $cmds) = @{$candidate};
        %VCS_cmds = %{$cmds};
        return $id if eval $VCS_cmds{"available"};
    }

    %VCS_cmds = ();
    if (!$printed_novcs) {
        warn("$P: No supported VCS found.  Add --nogit to options?\n");
        warn("Using a git repository produces better results.\n");
        warn("Try Linus Torvalds' latest git repository using:\n");
        warn("git clone git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git\n");
        $printed_novcs = 1;
    }
    return 0;
}
1479
# Return true when the VCS in use is git.
#
# The VCS is probed again on every call and the result is stored in
# $vcs_used, so the answer does not depend on an earlier caller having
# set that variable (a probe whose result is thrown away would compare a
# possibly stale value).
sub vcs_is_git {
    $vcs_used = vcs_exists();
    return $vcs_used == 1;
}
1484
# Return true when $vcs_used holds 2, the value vcs_exists() returns
# for hg.
sub vcs_is_hg {
    my $is_hg = ($vcs_used == 2);
    return $is_hg;
}
1488
# Interactive selection menu.
#
# $list_ref is a reference to a list of [email, role] pairs.  The entries
# are shown on STDERR, commands are read from STDIN, and the selected
# entries are returned once the user approves with "y".
#
# Commands that change how the list is computed (git/blame switches,
# limits, ...) set $rerun; the sub then tail-calls get_maintainers with
# its own argument list to recompute everything.
#
# Differences from a naive reading of the command table:
#  - "t" on its own toggles "all signature types"; "tm", "tg", "tl" and
#    "ts" toggle groups of entries.  Both forms are handled in one branch
#    (a second, later test for "t" could never be reached).
#  - Bounds checks use the number of entries, not the redraw counter, so
#    numeric selections keep working after an "invalid option" message
#    suppressed the redraw.
#  - End of input on STDIN is treated like "y"; otherwise the menu would
#    loop forever on an undefined input line.
sub interactive_get_maintainers {
    my ($list_ref) = @_;
    my @list = @$list_ref;
    my $total = @list;

    vcs_exists();

    my %selected;
    my %authored;
    my %signed;
    my $maintained = 0;
    for my $i (0 .. $total - 1) {
        $maintained = 1 if ($list[$i]->[1] =~ /^(maintainer|supporter)/i);
        $selected{$i} = 1;
        $authored{$i} = 0;
        $signed{$i} = 0;
    }

    # "t<letter>" group toggles: letter => pattern applied to the role
    my %group_pattern = (
        "m" => qr/^(maintainer|supporter)/i,
        "g" => qr/^(author|commit|signer)/i,
        "l" => qr/^(open list)/i,
        "s" => qr/^(subscriber list)/i,
    );

    #menu loop
    my $done = 0;
    my $print_options = 0;
    my $redraw = 1;
    while (!$done) {
        if ($redraw) {
            printf STDERR "\n%1s %2s %-65s",
                "*", "#", "email/list and role:stats";
            if ($email_git ||
                ($email_git_fallback && !$maintained) ||
                $email_git_blame) {
                print STDERR "auth sign";
            }
            print STDERR "\n";
            for my $i (0 .. $total - 1) {
                my $email = $list[$i]->[0];
                my $role = $list[$i]->[1];
                my $sel = "";
                $sel = "*" if ($selected{$i});
                my $commit_author = $commit_author_hash{$email} || [];
                my $commit_signer = $commit_signer_hash{$email} || [];
                my $authored = scalar(@{$commit_author});
                my $signed = scalar(@{$commit_signer});
                printf STDERR "%1s %2d %-65s", $sel, $i + 1, $email;
                printf STDERR "%4d %4d", $authored, $signed
                    if ($authored > 0 || $signed > 0);
                printf STDERR "\n %s\n", $role;
                if ($authored{$i}) {
                    foreach my $ref (@{$commit_author}) {
                        print STDERR " Author: @{$ref}[1]\n";
                    }
                }
                if ($signed{$i}) {
                    foreach my $ref (@{$commit_signer}) {
                        print STDERR " @{$ref}[2]: @{$ref}[1]\n";
                    }
                }
            }
        }
        my $date_ref = \$email_git_since;
        $date_ref = \$email_hg_since if (vcs_is_hg());
        if ($print_options) {
            $print_options = 0;
            if (vcs_exists()) {
                print STDERR <<EOT;

Version Control options:
g use git history [$email_git]
gf use git-fallback [$email_git_fallback]
b use git blame [$email_git_blame]
bs use blame signatures [$email_git_blame_signatures]
c# minimum commits [$email_git_min_signatures]
%# min percent [$email_git_min_percent]
d# history to use [$$date_ref]
x# max maintainers [$email_git_max_maintainers]
t all signature types [$email_git_all_signature_types]
m use .mailmap [$email_use_mailmap]
EOT
            }
            print STDERR <<EOT;

Additional options:
0 toggle all
tm toggle maintainers
tg toggle git entries
tl toggle open list entries
ts toggle subscriber list entries
f emails in file [$file_emails]
k keywords in file [$keywords]
r remove duplicates [$email_remove_duplicates]
p# pattern match depth [$pattern_depth]
EOT
        }
        print STDERR
"\n#(toggle), A#(author), S#(signed) *(all), ^(none), O(options), Y(approve): ";

        my $input = <STDIN>;
        # End of input: nothing more can be typed, accept the selection.
        $input = "y" if (!defined($input));
        chomp($input);

        $redraw = 1;
        my $rerun = 0;
        my @wish = split(/[, ]+/, $input);
        foreach my $nr (@wish) {
            $nr = lc($nr);
            my $sel = substr($nr, 0, 1);
            my $str = substr($nr, 1);
            my $val = 0;
            $val = $1 if $str =~ /^(\d+)$/;

            if ($sel eq "y") {
                $interactive = 0;
                $done = 1;
                $output_rolestats = 0;
                $output_roles = 0;
                last;
            } elsif ($nr =~ /^\d+$/ && $nr > 0 && $nr <= $total) {
                $selected{$nr - 1} = !$selected{$nr - 1};
            } elsif ($sel eq "*" || $sel eq '^') {
                my $toggle = ($sel eq '*') ? 1 : 0;
                $selected{$_} = $toggle for (0 .. $total - 1);
            } elsif ($sel eq "0") {
                $selected{$_} = !$selected{$_} for (0 .. $total - 1);
            } elsif ($sel eq "t") {
                if ($str eq "") {
                    # plain "t": all signature types
                    bool_invert(\$email_git_all_signature_types);
                    $rerun = 1;
                } elsif (exists $group_pattern{$str}) {
                    for my $i (0 .. $total - 1) {
                        $selected{$i} = !$selected{$i}
                            if ($list[$i]->[1] =~ $group_pattern{$str});
                    }
                }
            } elsif ($sel eq "a" || $sel eq "s") {
                # a#: show authored commits, s#: show signed commits
                my $detail = ($sel eq "a") ? \%authored : \%signed;
                if ($val > 0 && $val <= $total) {
                    $detail->{$val - 1} = !$detail->{$val - 1};
                } elsif ($str eq '*' || $str eq '^') {
                    my $toggle = ($str eq '*') ? 1 : 0;
                    $detail->{$_} = $toggle for (0 .. $total - 1);
                }
            } elsif ($sel eq "o") {
                $print_options = 1;
                $redraw = 1;
            } elsif ($sel eq "g") {
                if ($str eq "f") {
                    bool_invert(\$email_git_fallback);
                } else {
                    bool_invert(\$email_git);
                }
                $rerun = 1;
            } elsif ($sel eq "b") {
                if ($str eq "s") {
                    bool_invert(\$email_git_blame_signatures);
                } else {
                    bool_invert(\$email_git_blame);
                }
                $rerun = 1;
            } elsif ($sel eq "c") {
                if ($val > 0) {
                    $email_git_min_signatures = $val;
                    $rerun = 1;
                }
            } elsif ($sel eq "x") {
                if ($val > 0) {
                    $email_git_max_maintainers = $val;
                    $rerun = 1;
                }
            } elsif ($sel eq "%") {
                if ($str ne "" && $val >= 0) {
                    $email_git_min_percent = $val;
                    $rerun = 1;
                }
            } elsif ($sel eq "d") {
                if (vcs_is_git()) {
                    $email_git_since = $str;
                } elsif (vcs_is_hg()) {
                    $email_hg_since = $str;
                }
                $rerun = 1;
            } elsif ($sel eq "f") {
                bool_invert(\$file_emails);
                $rerun = 1;
            } elsif ($sel eq "r") {
                bool_invert(\$email_remove_duplicates);
                $rerun = 1;
            } elsif ($sel eq "m") {
                bool_invert(\$email_use_mailmap);
                read_mailmap();
                $rerun = 1;
            } elsif ($sel eq "k") {
                bool_invert(\$keywords);
                $rerun = 1;
            } elsif ($sel eq "p") {
                if ($str ne "" && $val >= 0) {
                    $pattern_depth = $val;
                    $rerun = 1;
                }
            } elsif ($sel eq "h" || $sel eq "?") {
                print STDERR <<EOT;

Interactive mode allows you to select the various maintainers, submitters,
commit signers and mailing lists that could be CC'd on a patch.

Any *'d entry is selected.

If you have git or hg installed, you can choose to summarize the commit
history of files in the patch. Also, each line of the current file can
be matched to its commit author and that commits signers with blame.

Various knobs exist to control the length of time for active commit
tracking, the maximum number of commit authors and signers to add,
and such.

Enter selections at the prompt until you are satisfied that the selected
maintainers are appropriate. You may enter multiple selections separated
by either commas or spaces.

EOT
            } else {
                print STDERR "invalid option: '$nr'\n";
                $redraw = 0;
            }
        }
        if ($rerun) {
            print STDERR "git-blame can be very slow, please have patience..."
                if ($email_git_blame);
            # tail call: recompute with the changed settings and @_
            goto &get_maintainers;
        }
    }

    #drop not selected entries
    my @new_emailto = ();
    for my $i (0 .. $total - 1) {
        push(@new_emailto, $list[$i]) if ($selected{$i});
    }
    return @new_emailto;
}
1768
683c6f8f
JP
# Flip the flag behind the scalar reference $bool_ref: a true value
# becomes 0, a false value becomes 1.
sub bool_invert {
    my ($bool_ref) = @_;

    $$bool_ref = $$bool_ref ? 0 : 1;
}
1778
b9e2331d
JP
# Return the canonical form of $email.
#
# The email is formatted and mapped through mailmap_email().  With
# $email_remove_duplicates set it is then looked up in the
# %deduplicate_name_hash / %deduplicate_address_hash tables (by
# lower-cased name first, then by lower-cased address): a hit replaces
# name and address with the recorded pair, a miss records the pair under
# both keys.  The result is formatted and mapped once more.
sub deduplicate_email {
    my ($email) = @_;

    my ($name, $address) = parse_email($email);
    $email = mailmap_email(format_email($name, $address, 1));

    return $email if (!$email_remove_duplicates);

    ($name, $address) = parse_email($email);

    my $known;
    if ($name ne "" && $deduplicate_name_hash{lc($name)}) {
        $known = $deduplicate_name_hash{lc($name)};
    } elsif ($deduplicate_address_hash{lc($address)}) {
        $known = $deduplicate_address_hash{lc($address)};
    }

    if ($known) {
        ($name, $address) = ($known->[0], $known->[1]);
    } else {
        $deduplicate_name_hash{lc($name)} = [ $name, $address ];
        $deduplicate_address_hash{lc($address)} = [ $name, $address ];
    }

    return mailmap_email(format_email($name, $address, 1));
}
1808
683c6f8f
JP
# Record, per author, the commits found in the VCS output @lines.
#
# Authors, commit ids and subjects are collected into three parallel
# lists (an author is passed through deduplicate_email()); the i-th
# [commit, subject] pair is then appended to
# $commit_author_hash{i-th author} unless an identical pair is already
# stored there.
sub save_commits_by_author {
    my (@lines) = @_;

    my (@authors, @commits, @subjects);

    foreach my $line (@lines) {
        if ($line =~ m/$VCS_cmds{"author_pattern"}/) {
            my $author = $1;
            push(@authors, deduplicate_email($author));
        }
        push(@commits, $1) if ($line =~ m/$VCS_cmds{"commit_pattern"}/);
        push(@subjects, $1) if ($line =~ m/$VCS_cmds{"subject_pattern"}/);
    }

    for my $i (0 .. $#authors) {
        my $known = ($commit_author_hash{$authors[$i]} ||= []);

        my $exists = 0;
        foreach my $ref (@{$known}) {
            next if ($ref->[0] ne $commits[$i]);
            next if ($ref->[1] ne $subjects[$i]);
            $exists = 1;
            last;
        }

        push(@{$known}, [ $commits[$i], $subjects[$i] ]) if (!$exists);
    }
}
1841
683c6f8f
JP
# Record, per signer, the commits found in the VCS output @lines.
#
# The most recent commit id and subject seen so far are remembered while
# scanning; every signature line then adds a [commit, subject, type]
# triple to $commit_signer_hash{signer} unless an identical triple is
# already stored there.
sub save_commits_by_signer {
    my (@lines) = @_;

    my $commit = "";
    my $subject = "";

    foreach my $line (@lines) {
        $commit = $1 if ($line =~ m/$VCS_cmds{"commit_pattern"}/);
        $subject = $1 if ($line =~ m/$VCS_cmds{"subject_pattern"}/);

        next unless ($line =~ /^[ \t]*${signature_pattern}.*\@.*$/);

        my ($types_ref, $signers_ref) = extract_formatted_signatures($line);
        my $type = $types_ref->[0];
        my $signer = deduplicate_email($signers_ref->[0]);

        my $known = ($commit_signer_hash{$signer} ||= []);

        my $exists = 0;
        foreach my $ref (@{$known}) {
            next if ($ref->[0] ne $commit);
            next if ($ref->[1] ne $subject);
            next if ($ref->[2] ne $type);
            $exists = 1;
            last;
        }

        push(@{$known}, [ $commit, $subject, $type ]) if (!$exists);
    }
}
1878
# Turn a list of emails (@lines, one element per occurrence) into
# entries with role $role.
#
# The emails are mapped through mailmap() and counted; they are then
# visited from most to least frequent.  Ignored addresses are skipped.
# The walk stops at the first email whose count is below
# $email_git_min_signatures, whose rank exceeds
# $email_git_max_maintainers, or whose share of $divisor (capped at 100%)
# is below $email_git_min_percent.  Each accepted email is pushed and
# given the role, with "count/divisor=percent%" appended when
# $output_rolestats is set.  A divisor <= 0 is reported and replaced by 1.
sub vcs_assign {
    my ($role, $divisor, @lines) = @_;

    return if (@lines <= 0);

    if ($divisor <= 0) {
        warn("Bad divisor in " . (caller(0))[3] . ": $divisor\n");
        $divisor = 1;
    }

    @lines = mailmap(@lines);

    return if (@lines <= 0);

    # uniq -c
    my %occurrences;
    foreach my $email (sort(@lines)) {
        $occurrences{$email}++;
    }

    # sort -rn
    my @by_frequency =
        sort { $occurrences{$b} <=> $occurrences{$a} } keys %occurrences;

    my $accepted = 0;
    foreach my $line (@by_frequency) {
        my $sign_offs = $occurrences{$line};
        my $percent = $sign_offs * 100 / $divisor;
        $percent = 100 if ($percent > 100);

        next if (ignore_email_address($line));

        $accepted++;
        last if ($sign_offs < $email_git_min_signatures);
        last if ($accepted > $email_git_max_maintainers);
        last if ($percent < $email_git_min_percent);

        push_email_address($line, '');

        my $label = $role;
        if ($output_rolestats) {
            my $fmt_percent = sprintf("%.0f", $percent);
            $label = "$role:$sign_offs/$divisor=$fmt_percent%";
        }
        add_role($line, $label);
    }
}
1921
# Add people taken from the VCS history of $file.
#
# Signers get the role "commit_signer" and authors the role "authored",
# both relative to the number of commits.  When there is exactly one
# stat line per author line, per-author "added_lines" and "removed_lines"
# roles are assigned as well, relative to the total number of added and
# removed lines.  Nothing happens when no VCS is available.
#
# $file and $cmd keep these names because the command and stat templates
# are expanded with s///ee, which resolves "$name" against the lexicals
# in scope.
sub vcs_file_signoffs {
    my ($file) = @_;

    my $authors_ref;
    my $signers_ref;
    my $stats_ref;
    my $commits;

    $vcs_used = vcs_exists();
    return if (!$vcs_used);

    my $cmd = $VCS_cmds{"find_signers_cmd"};
    $cmd =~ s/(\$\w+)/$1/eeg;		# interpolate $cmd

    ($commits, $signers_ref, $authors_ref, $stats_ref) = vcs_find_signers($cmd, $file);

    my @signers = defined($signers_ref) ? @{$signers_ref} : ();
    my @authors = defined($authors_ref) ? @{$authors_ref} : ();
    my @stats = defined($stats_ref) ? @{$stats_ref} : ();

    foreach my $signer (@signers) {
        $signer = deduplicate_email($signer);
    }

    vcs_assign("commit_signer", $commits, @signers);
    vcs_assign("authored", $commits, @authors);

    if ($#authors == $#stats) {
        my $stat_pattern = $VCS_cmds{"stat_pattern"};
        $stat_pattern =~ s/(\$\w+)/$1/eeg;	#interpolate $stat_pattern

        # totals over all commits
        my ($added, $deleted) = (0, 0);
        foreach my $stat (@stats) {
            if ($stat =~ /$stat_pattern/) {
                $added += $1;
                $deleted += $2;
            }
        }

        my @tmp_authors = uniq(@authors);
        foreach my $author (@tmp_authors) {
            $author = deduplicate_email($author);
        }
        @tmp_authors = uniq(@tmp_authors);

        # one list element per added/removed line, so vcs_assign() can
        # count them
        my @list_added = ();
        my @list_deleted = ();
        foreach my $author (@tmp_authors) {
            my ($auth_added, $auth_deleted) = (0, 0);
            for my $i (0 .. $#stats) {
                next if ($author ne deduplicate_email($authors[$i]));
                next if ($stats[$i] !~ /$stat_pattern/);
                $auth_added += $1;
                $auth_deleted += $2;
            }
            push(@list_added, ($author) x $auth_added);
            push(@list_deleted, ($author) x $auth_deleted);
        }
        vcs_assign("added_lines", $added, @list_added);
        vcs_assign("removed_lines", $deleted, @list_deleted);
    }
}
1993
# Add people taken from the blame output of $file.
#
# The blamed commits are looked up for their signers when
# $email_git_blame_signatures is set.  With $from_filename and
# $output_rolestats both set, commit authors are collected too: under git
# one entry per blamed line, assigned as "authored lines"; under hg the
# authors are added to the signer list.  The signers are finally assigned
# as "commits" ($from_filename) or "modified commits".  Nothing happens
# when no VCS is available.
#
# $file, $commit and $cmd keep these names because the command templates
# are expanded with s///ee, which resolves "$name" against the lexicals
# in scope.
sub vcs_file_blame {
    my ($file) = @_;

    my @signers = ();

    $vcs_used = vcs_exists();
    return if (!$vcs_used);

    my @all_commits = vcs_blame($file);
    my @commits = uniq(@all_commits);
    my $total_commits = @commits;
    my $total_lines = @all_commits;

    if ($email_git_blame_signatures) {
        # hg takes all revisions in a single command (joined with
        # " -r "), git is asked once per commit
        my @queries = vcs_is_hg() ? (join(" -r ", @commits)) : @commits;

        foreach my $commit (@queries) {
            my $cmd = $VCS_cmds{"find_commit_signers_cmd"};
            $cmd =~ s/(\$\w+)/$1/eeg;	#substitute variables in $cmd

            my (undef, $commit_signers_ref) = vcs_find_signers($cmd, $file);
            push(@signers, @{$commit_signers_ref})
                if defined $commit_signers_ref;
        }
    }

    if ($from_filename && $output_rolestats) {
        my @blame_signers;

        if (vcs_is_hg()) {
            @commits = uniq(@commits);
            @commits = sort(@commits);
            my $commit = join(" -r ", @commits);

            my $cmd = $VCS_cmds{"find_commit_author_cmd"};
            $cmd =~ s/(\$\w+)/$1/eeg;	#substitute variables in $cmd

            my @lines = $VCS_cmds{"execute_cmd"}->($cmd);

            @lines = grep(!/${penguin_chiefs}/i, @lines)
                if (!$email_git_penguin_chiefs);

            if (@lines) {
                my @authors = ();
                foreach my $line (@lines) {
                    next unless ($line =~ m/$VCS_cmds{"author_pattern"}/);
                    my $author = $1;
                    push(@authors, deduplicate_email($author));
                }

                if ($interactive) {
                    save_commits_by_author(@lines);
                    save_commits_by_signer(@lines);
                }

                push(@signers, @authors);
            }
        } else {
            foreach my $commit (@commits) {
                my $cmd = $VCS_cmds{"find_commit_author_cmd"};
                $cmd =~ s/(\$\w+)/$1/eeg;	#interpolate $cmd

                my @author = vcs_find_author($cmd);
                next if !@author;

                my $formatted_author = deduplicate_email($author[0]);

                # one entry per line blamed on this commit
                my $count = grep(/$commit/, @all_commits);
                push(@blame_signers, ($formatted_author) x $count);
            }
        }

        if (@blame_signers) {
            vcs_assign("authored lines", $total_lines, @blame_signers);
        }
    }

    foreach my $signer (@signers) {
        $signer = deduplicate_email($signer);
    }

    if ($from_filename) {
        vcs_assign("commits", $total_commits, @signers);
    } else {
        vcs_assign("modified commits", $total_commits, @signers);
    }
}
2121
# Return the arguments with duplicates removed, keeping the first
# occurrence of each value and the original relative order.
sub uniq {
    my %seen;
    my @unique;

    foreach my $item (@_) {
        next if $seen{$item}++;
        push(@unique, $item);
    }
    return @unique;
}
2129
# Return the arguments sorted with the default (string) ordering and with
# duplicate values dropped.
sub sort_and_uniq {
    my %seen;
    my @sorted_unique = grep { !$seen{$_}++ } sort(@_);

    return @sorted_unique;
}
2138
03372dbb
JP
# Normalize e-mail entries that were harvested from a file's contents.
#
# For each entry:
#   * the address is rewritten as "<addr>", whether it was bare or wrapped
#     in (), <> or {};
#   * parse_email() splits the entry into a name and an address;
#   * when the name has more than two words only the last two are kept, or
#     the last three if the first or middle of those looks like an initial;
#   * one leading and one trailing "," or "." is trimmed from the name,
#     also when the name is wrapped in double quotes.
#
# Parameters: list of raw e-mail strings.
# Returns:    list of format_email() results, one per input, in input order.
sub clean_file_emails {
    my (@file_emails) = @_;
    my @fmt_emails = ();

    foreach my $email (@file_emails) {
        $email =~ s/[\(\<\{]{0,1}([A-Za-z0-9_\.\+-]+\@[A-Za-z0-9\.-]+)[\)\>\}]{0,1}/\<$1\>/g;
        my ($name, $address) = parse_email($email);

        # A name that is nothing but a quoted "," or "." carries no
        # information.  This has to be a pattern match: comparing with eq
        # against the pattern text itself could never succeed for such a name.
        if ($name =~ m/^"[,\.]"$/) {
            $name = "";
        }

        # Split into name-like words; anything outside the class separates.
        my @nw = split(/[^A-Za-zÀ-ÿ\'\,\.\+-]/, $name);
        if (@nw > 2) {
            my $first = $nw[@nw - 3];
            my $middle = $nw[@nw - 2];
            my $last = $nw[@nw - 1];

            # "J" / "J." as first word, or any one-character / "X." middle
            # word, is treated as an initial and keeps all three words.
            if (((length($first) == 1 && $first =~ m/[A-Za-z]/) ||
                 (length($first) == 2 && substr($first, -1) eq ".")) ||
                (length($middle) == 1 ||
                 (length($middle) == 2 && substr($middle, -1) eq "."))) {
                $name = "$first $middle $last";
            } else {
                $name = "$middle $last";
            }
        }

        # Trim trailing punctuation, keeping a closing quote if present.
        if (substr($name, -1) =~ /[,\.]/) {
            $name = substr($name, 0, length($name) - 1);
        } elsif (substr($name, -2) =~ /[,\.]"/) {
            $name = substr($name, 0, length($name) - 2) . '"';
        }

        # Trim leading punctuation, keeping an opening quote if present.
        if (substr($name, 0, 1) =~ /[,\.]/) {
            $name = substr($name, 1, length($name) - 1);
        } elsif (substr($name, 0, 2) =~ /"[,\.]/) {
            $name = '"' . substr($name, 2, length($name) - 2);
        }

        my $fmt_email = format_email($name, $address, $email_usename);
        push(@fmt_emails, $fmt_email);
    }
    return @fmt_emails;
}
2183
3c7385b8
JP
# Collapse a list of [address, role] pairs into output lines.
#
# Each argument is an array reference holding an address and its role.
# Only the first pair seen for a given address is used; the line is
# "address (role)" when $output_roles is set, otherwise just the address.
# Returns the lines in first-seen order.
sub merge_email {
    my @merged;
    my %seen;

    foreach my $entry (@_) {
        my ($address, $role) = @{$entry};

        next if $seen{$address};
        $seen{$address} = 1;

        push(@merged, $output_roles ? "$address ($role)" : $address);
    }

    return @merged;
}
2202
# Print the given strings to standard output: one per line when
# $output_multiline is set, otherwise joined with $output_separator on a
# single line terminated by a newline.
sub output {
    my (@lines) = @_;

    if (!$output_multiline) {
        print(join($output_separator, @lines));
        print("\n");
    } else {
        print("${_}\n") foreach @lines;
    }
}
1b5e1cf6
JP
2215
# Cached RFC 822 address pattern; filled in on first use from
# make_rfc822re().
my $rfc822re;

# Build, as a string, the regular expression for one RFC 822 address
# (a mailbox or a group), optionally preceded by whitespace.
#
# Basic lexical tokens are specials, domain_literal, quoted_string, atom and
# comment, and rfc822_lwsp (or comments) must be allowed after each of
# them.  The resulting regexp only works on addresses whose comments have
# already been stripped and replaced with rfc822_lwsp.
sub make_rfc822re {
    my $lwsp = $rfc822_lwsp;

    # Character sets, written so they can sit inside a [...] class
    my $special_chars = '()<>@,;:\\\\".\\[\\]';
    my $control_chars = '\\000-\\037\\177';

    my $dtext_class = "[^\\[\\]\\r\\\\]";
    my $literal = "\\[(?:$dtext_class|\\\\.)*\\]$lwsp*";

    my $quoted = "\"(?:[^\\\"\\r\\\\]|\\\\.|$lwsp)*\"$lwsp*";

    # A zero-width assertion spots the limit of an atom; a simple trailing
    # whitespace-star causes the regexp engine to hang occasionally.
    my $atom_re = "[^$special_chars $control_chars]+(?:$lwsp+|\\Z|(?=[\\[\"$special_chars]))";
    my $word_re = "(?:$atom_re|$quoted)";
    my $local_part = "$word_re(?:\\.$lwsp*$word_re)*";

    my $subdomain = "(?:$atom_re|$literal)";
    my $domain_re = "$subdomain(?:\\.$lwsp*$subdomain)*";

    my $spec = "$local_part\@$lwsp*$domain_re";

    my $phrase_re = "$word_re*";
    my $route_re = "(?:\@$domain_re(?:,\@$lwsp*$domain_re)*:$lwsp*)";
    my $angle_addr = "\\<$lwsp*$route_re?$spec\\>$lwsp*";
    my $mailbox_re = "(?:$spec|$phrase_re$angle_addr)";

    my $group_re = "$phrase_re:$lwsp*(?:$mailbox_re(?:,\\s*$mailbox_re)*)?;\\s*";

    # An address is either a single mailbox or a group of mailboxes
    return "$lwsp*(?:$mailbox_re|$group_re)";
}
2253
# Return the argument with every parenthesized comment that lies outside a
# double-quoted string replaced by a single space.
#
# Each pass removes one comment that contains no further parentheses, so
# repeating until nothing matches unwinds nested comments from the inside
# out.  Backslash-escaped characters are skipped as a unit; the simpler
# regexps in the Email Addressing FAQ are imperfect because they miss
# escaped chars in atoms, for example.
sub rfc822_strip_comments {
    my ($text) = @_;

    1 while $text =~ s/^((?:[^"\\]|\\.)*
                         (?:"(?:[^"\\]|\\.)*"(?:[^"\\]|\\.)*)*)
                        \((?:[^()\\]|\\.)*\)/$1 /osx;

    return $text;
}
2265
# valid: returns true if the parameter is an RFC822 valid address
#
# Comments are stripped first; the remainder must match the address
# pattern as a whole and consist only of $rfc822_char characters.
sub rfc822_valid {
    my $candidate = rfc822_strip_comments(shift);

    # The address pattern is built on first use and cached
    $rfc822re ||= make_rfc822re();

    return $candidate =~ m/^$rfc822re$/so && $candidate =~ m/^$rfc822_char*$/;
}
2277
# validlist: In scalar context, returns true if the parameter is an RFC822
#            valid list of addresses.
#
#            In list context, returns an empty list on failure (an invalid
#            address was found); otherwise a list whose first element is the
#            number of addresses found and whose remaining elements are the
#            addresses.  This is needed to disambiguate failure (invalid)
#            from success with no addresses found, because an empty string is
#            a valid list.
sub rfc822_validlist {
    my $list = rfc822_strip_comments(shift);

    # The address pattern is built on first use and cached
    $rfc822re ||= make_rfc822re();

    # * null list items are valid according to the RFC
    unless ($list =~ m/^(?:$rfc822re)?(?:,(?:$rfc822re)?)*$/so &&
            $list =~ m/^$rfc822_char*$/) {
        return wantarray ? () : 0;
    }

    my @addresses;
    while ($list =~ m/(?:^|,$rfc822_lwsp*)($rfc822re)/gos) {
        push(@addresses, $1);
    }

    # * the leading count is to aid in distinguishing failure from no results
    return wantarray ? (scalar(@addresses), @addresses) : 1;
}