perf tools: Don't clone maps from parent when synthesizing forks
[linux/fpc-iii.git] / scripts / get_maintainer.pl
blobc1c088ef1420e68aa6a56bf041dd019aa82e64ee
#!/usr/bin/env perl
# SPDX-License-Identifier: GPL-2.0
#
# (c) 2007, Joe Perches <joe@perches.com>
#           created from checkpatch.pl
#
# Print selected MAINTAINERS information for
# the files modified in a patch or for a file
#
# usage: perl scripts/get_maintainer.pl [OPTIONS] <patch>
#        perl scripts/get_maintainer.pl [OPTIONS] -f <file>
#
use warnings;
use strict;

# Program name as invoked and script version; both appear in diagnostics
# and in the --version / --help output.
my $P = $0;
my $V = '0.26';

use Getopt::Long qw(:config no_auto_abbrev);
use Cwd;
use File::Find;

# Path prefixes: the current directory (with trailing '/') and the path to
# the kernel tree root.  Both are stripped from file arguments later on.
my $cur_path = fastgetcwd() . '/';
my $lk_path = "./";

# Default values for the command line options.  Each of these is bound to
# an option in the GetOptions() call further down.
my $email = 1;
my $email_usename = 1;
my $email_maintainer = 1;
my $email_reviewer = 1;
my $email_list = 1;
my $email_subscriber_list = 0;
my $email_git_penguin_chiefs = 0;
my $email_git = 0;
my $email_git_all_signature_types = 0;
my $email_git_blame = 0;
my $email_git_blame_signatures = 1;
my $email_git_fallback = 1;
my $email_git_min_signatures = 1;
my $email_git_max_maintainers = 5;
my $email_git_min_percent = 5;
my $email_git_since = "1-year-ago";
my $email_hg_since = "-365";
my $interactive = 0;
my $email_remove_duplicates = 1;
my $email_use_mailmap = 1;
my $output_multiline = 1;
my $output_separator = ", ";
my $output_roles = 0;
my $output_rolestats = 1;
my $output_section_maxlen = 50;
my $scm = 0;
my $tree = 1;
my $web = 0;
my $subsystem = 0;
my $status = 0;
my $letters = "";
my $keywords = 1;
my $sections = 0;
my $file_emails = 0;
my $from_filename = 0;
my $pattern_depth = 0;
my $self_test = undef;          # undef means --self-test was not given
my $version = 0;
my $help = 0;
my $find_maintainer_files = 0;
my $maintainer_path;
my $vcs_used = 0;

# Process exit status, passed to exit() once all output has been printed.
my $exit = 0;
my %commit_author_hash;
my %commit_signer_hash;

# "Name:address" pairs for the top-level maintainers that are filtered
# out of (or, with --git-chief-penguins, added to) the email output.
my @penguin_chief = ();
push(@penguin_chief, "Linus Torvalds:torvalds\@linux-foundation.org");
#Andrew wants in on most everything - 2009/01/14
#push(@penguin_chief, "Andrew Morton:akpm\@linux-foundation.org");

# Collect just the names so they can be shown as an alternation in --help.
my @penguin_chief_names = ();
foreach my $chief (@penguin_chief) {
    if ($chief =~ m/^(.*):(.*)/) {
        my $chief_name = $1;
        my $chief_addr = $2;
        push(@penguin_chief_names, $chief_name);
    }
}
my $penguin_chiefs = "\(" . join("|", @penguin_chief_names) . "\)";

# Signature types of people who are either
#	a) responsible for the code in question, or
#	b) familiar enough with it to give relevant feedback
my @signature_tags = ();
push(@signature_tags, "Signed-off-by:");
push(@signature_tags, "Reviewed-by:");
push(@signature_tags, "Acked-by:");

# Regex alternation of the tags above; get_maintainers() rebuilds it
# depending on --git-all-signature-types.
my $signature_pattern = "\(" . join("|", @signature_tags) . "\)";

# rfc822 email address - preloaded methods go here.
my $rfc822_lwsp = "(?:(?:\\r\\n)?[ \\t])";
my $rfc822_char = '[\\000-\\377]';
# VCS command support: class-like functions and strings
#
# Each table maps an operation name to either a code reference or a
# command / regex template.  Placeholders such as \$file, \$commit and
# \$email_git_since are stored literally (the '$' is escaped or single
# quoted); NOTE(review): they are presumably expanded by the code that
# runs the command, which is outside this section - confirm there.

my %VCS_cmds;

my %VCS_cmds_git = (
    "execute_cmd" => \&git_execute_cmd,
    "available" => '(which("git") ne "") && (-e ".git")',
    "find_signers_cmd" =>
        "git log --no-color --follow --since=\$email_git_since " .
            '--numstat --no-merges ' .
            '--format="GitCommit: %H%n' .
                      'GitAuthor: %an <%ae>%n' .
                      'GitDate: %aD%n' .
                      'GitSubject: %s%n' .
                      '%b%n"' .
            " -- \$file",
    "find_commit_signers_cmd" =>
        "git log --no-color " .
            '--numstat ' .
            '--format="GitCommit: %H%n' .
                      'GitAuthor: %an <%ae>%n' .
                      'GitDate: %aD%n' .
                      'GitSubject: %s%n' .
                      '%b%n"' .
            " -1 \$commit",
    "find_commit_author_cmd" =>
        "git log --no-color " .
            '--numstat ' .
            '--format="GitCommit: %H%n' .
                      'GitAuthor: %an <%ae>%n' .
                      'GitDate: %aD%n' .
                      'GitSubject: %s%n"' .
            " -1 \$commit",
    "blame_range_cmd" => "git blame -l -L \$diff_start,+\$diff_length \$file",
    "blame_file_cmd" => "git blame -l \$file",
    "commit_pattern" => "^GitCommit: ([0-9a-f]{40,40})",
    "blame_commit_pattern" => "^([0-9a-f]+) ",
    "author_pattern" => "^GitAuthor: (.*)",
    "subject_pattern" => "^GitSubject: (.*)",
    "stat_pattern" => "^(\\d+)\\t(\\d+)\\t\$file\$",
    "file_exists_cmd" => "git ls-files \$file",
    "list_files_cmd" => "git ls-files \$file",
);

my %VCS_cmds_hg = (
    "execute_cmd" => \&hg_execute_cmd,
    "available" => '(which("hg") ne "") && (-d ".hg")',
    "find_signers_cmd" =>
        "hg log --date=\$email_hg_since " .
            "--template='HgCommit: {node}\\n" .
                        "HgAuthor: {author}\\n" .
                        "HgSubject: {desc}\\n'" .
            " -- \$file",
    "find_commit_signers_cmd" =>
        "hg log " .
            "--template='HgSubject: {desc}\\n'" .
            " -r \$commit",
    "find_commit_author_cmd" =>
        "hg log " .
            "--template='HgCommit: {node}\\n" .
                        "HgAuthor: {author}\\n" .
                        "HgSubject: {desc|firstline}\\n'" .
            " -r \$commit",
    "blame_range_cmd" => "",		# not supported
    "blame_file_cmd" => "hg blame -n \$file",
    "commit_pattern" => "^HgCommit: ([0-9a-f]{40,40})",
    "blame_commit_pattern" => "^([ 0-9a-f]+):",
    "author_pattern" => "^HgAuthor: (.*)",
    "subject_pattern" => "^HgSubject: (.*)",
    "stat_pattern" => "^(\\d+)\t(\\d+)\t\$file\$",
    "file_exists_cmd" => "hg files \$file",
    "list_files_cmd" => "hg manifest -R \$file",
);
# Prepend the words found in .get_maintainer.conf to @ARGV so the file can
# set default options.  Blank lines and '#' comments (whole-line or
# trailing) are ignored.
my $conf = which_conf(".get_maintainer.conf");
if (-f $conf) {
    my @conf_args;
    if (open(my $conffile, '<', "$conf")) {
        while (my $line = <$conffile>) {
            $line =~ s/\s*\n?$//g;
            $line =~ s/^\s*//g;
            $line =~ s/\s+/ /g;

            next if ($line =~ m/^\s*#/);
            next if ($line =~ m/^\s*$/);

            my @words = split(" ", $line);
            foreach my $word (@words) {
                # everything from a word starting with '#' onward is a comment
                last if ($word =~ m/^#/);
                push (@conf_args, $word);
            }
        }
        close($conffile);
    } else {
        # Unreadable file: warn and carry on with no extra arguments rather
        # than reading from a handle that was never opened.
        warn "$P: Can't find a readable .get_maintainer.conf file $!\n";
    }
    unshift(@ARGV, @conf_args) if @conf_args;
}
# Addresses listed in .get_maintainer.ignore (one per line, '#' starts a
# comment) are collected here; ignore_email_address() compares against
# this list with exact string equality.
my @ignore_emails = ();
my $ignore_file = which_conf(".get_maintainer.ignore");
if (-f $ignore_file) {
    if (open(my $ignore, '<', "$ignore_file")) {
        while (my $line = <$ignore>) {
            # Strip the comment first and trim afterwards, so that
            # "addr  # note" does not keep the blanks before the '#'.
            $line =~ s/#.*$//;
            $line =~ s/\s*\n?$//;
            $line =~ s/^\s*//;
            $line =~ s/\s+$//;

            next if ($line =~ m/^\s*$/);
            if (rfc822_valid($line)) {
                push(@ignore_emails, $line);
            }
        }
        close($ignore);
    } else {
        # Unreadable file: warn and continue with an empty ignore list.
        warn "$P: Can't find a readable .get_maintainer.ignore file $!\n";
    }
}
# --self-test must be the only argument: with more than one argument
# present, refuse to run if any of them is --self-test.
if ($#ARGV > 0) {
    foreach (@ARGV) {
        if ($_ =~ /^-{1,2}self-test(?:=|$)/) {
            die "$P: using --self-test does not allow any other option or argument\n";
        }
    }
}

# Bind every command line option to its default-holding variable.
# A trailing '!' makes the option negatable (--no<foo> / --no-<foo>).
if (!GetOptions(
                'email!' => \$email,
                'git!' => \$email_git,
                'git-all-signature-types!' => \$email_git_all_signature_types,
                'git-blame!' => \$email_git_blame,
                'git-blame-signatures!' => \$email_git_blame_signatures,
                'git-fallback!' => \$email_git_fallback,
                'git-chief-penguins!' => \$email_git_penguin_chiefs,
                'git-min-signatures=i' => \$email_git_min_signatures,
                'git-max-maintainers=i' => \$email_git_max_maintainers,
                'git-min-percent=i' => \$email_git_min_percent,
                'git-since=s' => \$email_git_since,
                'hg-since=s' => \$email_hg_since,
                'i|interactive!' => \$interactive,
                'remove-duplicates!' => \$email_remove_duplicates,
                'mailmap!' => \$email_use_mailmap,
                'm!' => \$email_maintainer,
                'r!' => \$email_reviewer,
                'n!' => \$email_usename,
                'l!' => \$email_list,
                's!' => \$email_subscriber_list,
                'multiline!' => \$output_multiline,
                'roles!' => \$output_roles,
                'rolestats!' => \$output_rolestats,
                'separator=s' => \$output_separator,
                'subsystem!' => \$subsystem,
                'status!' => \$status,
                'scm!' => \$scm,
                'tree!' => \$tree,
                'web!' => \$web,
                'letters=s' => \$letters,
                'pattern-depth=i' => \$pattern_depth,
                'k|keywords!' => \$keywords,
                'sections!' => \$sections,
                'fe|file-emails!' => \$file_emails,
                'f|file' => \$from_filename,
                'find-maintainer-files' => \$find_maintainer_files,
                'mpath|maintainer-path=s' => \$maintainer_path,
                'self-test:s' => \$self_test,
                'v|version' => \$version,
                'h|help|usage' => \$help,
                )) {
    die "$P: invalid argument - use --help if necessary\n";
}
# Options that print something and exit immediately.
if ($help != 0) {
    usage();
    exit 0;
}

if ($version != 0) {
    print("${P} ${V}\n");
    exit 0;
}

if (defined $self_test) {
    read_all_maintainer_files();
    self_test();
    exit 0;
}

if (-t STDIN && !@ARGV) {
    # We're talking to a terminal, but have no command line arguments.
    die "$P: missing patchfile or -f file - use --help if necessary\n";
}

# Derived settings: a custom separator implies single-line output,
# interactive mode implies rolestats, and rolestats implies roles.
$output_multiline = 0 if ($output_separator ne ", ");
$output_rolestats = 1 if ($interactive);
$output_roles = 1 if ($output_rolestats);

if ($sections || $letters ne "") {
    # Section printing replaces every other kind of output.
    $sections = 1;
    $email = 0;
    $email_list = 0;
    $scm = 0;
    $status = 0;
    $subsystem = 0;
    $web = 0;
    $keywords = 0;
    $interactive = 0;
} else {
    my $selections = $email + $scm + $status + $subsystem + $web;
    if ($selections == 0) {
        die "$P: Missing required option: email, scm, status, subsystem or web\n";
    }
}

if ($email &&
    ($email_maintainer + $email_reviewer +
     $email_list + $email_subscriber_list +
     $email_git + $email_git_penguin_chiefs + $email_git_blame) == 0) {
    die "$P: Please select at least 1 email option\n";
}

if ($tree && !top_of_kernel_tree($lk_path)) {
    die "$P: The current directory does not appear to be "
        . "a linux kernel source tree.\n";
}
## Read MAINTAINERS for type/value pairs

my @typevalue = ();       # section headers and "T:value" entries, in file order
my %keyword_hash;         # @typevalue index of a K: entry => its keyword regex
my @mfiles = ();          # MAINTAINERS files to read
my @self_test_info = ();  # per-line records, filled only when --self-test is set

# Parse one MAINTAINERS file and append its content to @typevalue.
#
# Lines of the form "X: value" (single capital letter) are stored as
# "X:value"; F: and X: globs are converted to regex syntax first, and K:
# values are additionally remembered in %keyword_hash.  Any other line that
# is neither blank nor a '#' comment is stored unchanged (section headers).
# Dies if $file cannot be opened.
sub read_maintainer_file {
    my ($file) = @_;

    open (my $maint, '<', "$file")
        or die "$P: Can't open MAINTAINERS file '$file': $!\n";
    my $i = 1;
    while (my $line = <$maint>) {
        chomp $line;

        if ($line =~ m/^([A-Z]):\s*(.*)/) {
            my $type = $1;
            my $value = $2;

            ##Filename pattern matching
            if ($type eq "F" || $type eq "X") {
                $value =~ s@\.@\\\.@g;       ##Convert . to \.
                $value =~ s/\*/\.\*/g;       ##Convert * to .*
                $value =~ s/\?/\./g;         ##Convert ? to .
                ##if pattern is a directory and it lacks a trailing slash, add one
                if ((-d $value)) {
                    $value =~ s@([^/])$@$1/@;
                }
            } elsif ($type eq "K") {
                # The key is the index this entry is about to get in
                # @typevalue (the current element count).
                $keyword_hash{scalar(@typevalue)} = $value;
            }
            push(@typevalue, "$type:$value");
        } elsif (!($line =~ /^\s*$/ || $line =~ /^\s*\#/)) {
            push(@typevalue, $line);
        }
        if (defined $self_test) {
            push(@self_test_info, {file=>$file, linenr=>$i, line=>$line});
        }
        $i++;
    }
    close($maint);
}
# File::Find "wanted" callback: record every regular file whose path ends
# in "/MAINTAINERS" in @mfiles.  Reads the candidate from $_ and the full
# name from $File::Find::name.
sub find_is_maintainer_file {
    my ($file) = $_;
    return if ($file !~ m@/MAINTAINERS$@);
    $file = $File::Find::name;
    return if (! -f $file);
    push(@mfiles, $file);
}
# File::Find "preprocess" callback: return the given directory entries
# with any entry named exactly ".git" removed.
sub find_ignore_git {
    return grep { $_ !~ /^\.git$/; } @_;
}
read_all_maintainer_files();

# Locate the MAINTAINERS file(s) and feed each one to read_maintainer_file().
#
# The starting point is "${lk_path}MAINTAINERS" unless --maintainer-path
# was given (a leading "~" or "~user" in it is expanded).  If the path is
# a directory, either every non-dot entry in it is used or, with
# --find-maintainer-files, the tree is searched for files named
# MAINTAINERS.  Dies when nothing usable is found.
sub read_all_maintainer_files {
    my $path = "${lk_path}MAINTAINERS";
    if (defined $maintainer_path) {
        $path = $maintainer_path;
        # Perl Cookbook tilde expansion if necessary
        $path =~ s@^~([^/]*)@ $1 ? (getpwnam($1))[7] : ( $ENV{HOME} || $ENV{LOGDIR} || (getpwuid($<))[7])@ex;
    }

    if (-d $path) {
        $path .= '/' if ($path !~ m@/$@);
        if ($find_maintainer_files) {
            find( { wanted => \&find_is_maintainer_file,
                    preprocess => \&find_ignore_git,
                    no_chdir => 1,
                }, "$path");
        } else {
            # Lexical directory handle instead of the global bareword DIR.
            opendir(my $dir, "$path")
                or die "$P: Can't open directory '$path': $!\n";
            my @files = readdir($dir);
            closedir($dir);
            foreach my $file (@files) {
                push(@mfiles, "$path$file") if ($file !~ /^\./);
            }
        }
    } elsif (-f "$path") {
        push(@mfiles, "$path");
    } else {
        die "$P: MAINTAINER file not found '$path'\n";
    }
    die "$P: No MAINTAINER files found in '$path'\n" if (scalar(@mfiles) == 0);
    foreach my $file (@mfiles) {
        read_maintainer_file("$file");
    }
}
#
# Read mail address map
#

my $mailmap;

read_mailmap();

# Load "${lk_path}.mailmap" into $mailmap, a hash with two sub-hashes:
#   names     => { key => canonical name }
#   addresses => { key => canonical address }
# The key is the non-canonical address, or for the four-field form the
# formatted "name <address>" of the non-canonical identity.  $mailmap is
# always reset to empty tables, also when mailmap use is disabled or the
# file is missing or unreadable.
sub read_mailmap {
    $mailmap = {
        names => {},
        addresses => {}
    };

    return if (!$email_use_mailmap || !(-f "${lk_path}.mailmap"));

    my $mailmap_file;
    if (!open($mailmap_file, '<', "${lk_path}.mailmap")) {
        # Nothing to read; leave the tables empty instead of looping over
        # a handle that was never opened.
        warn "$P: Can't open .mailmap: $!\n";
        return;
    }

    while (<$mailmap_file>) {
        s/#.*$//; #strip comments
        s/^\s+|\s+$//g; #trim

        next if (/^\s*$/); #skip empty lines
        #entries have one of the following formats:
        # name1 <mail1>
        # <mail1> <mail2>
        # name1 <mail1> <mail2>
        # name1 <mail1> name2 <mail2>
        # (see man git-shortlog)

        if (/^([^<]+)<([^>]+)>$/) {
            my $real_name = $1;
            my $address = $2;

            $real_name =~ s/\s+$//;
            ($real_name, $address) = parse_email("$real_name <$address>");
            $mailmap->{names}->{$address} = $real_name;

        } elsif (/^<([^>]+)>\s*<([^>]+)>$/) {
            my $real_address = $1;
            my $wrong_address = $2;

            $mailmap->{addresses}->{$wrong_address} = $real_address;

        } elsif (/^(.+)<([^>]+)>\s*<([^>]+)>$/) {
            my $real_name = $1;
            my $real_address = $2;
            my $wrong_address = $3;

            $real_name =~ s/\s+$//;
            ($real_name, $real_address) =
                parse_email("$real_name <$real_address>");
            $mailmap->{names}->{$wrong_address} = $real_name;
            $mailmap->{addresses}->{$wrong_address} = $real_address;

        } elsif (/^(.+)<([^>]+)>\s*(.+)\s*<([^>]+)>$/) {
            my $real_name = $1;
            my $real_address = $2;
            my $wrong_name = $3;
            my $wrong_address = $4;

            $real_name =~ s/\s+$//;
            ($real_name, $real_address) =
                parse_email("$real_name <$real_address>");

            $wrong_name =~ s/\s+$//;
            ($wrong_name, $wrong_address) =
                parse_email("$wrong_name <$wrong_address>");

            my $wrong_email = format_email($wrong_name, $wrong_address, 1);
            $mailmap->{names}->{$wrong_email} = $real_name;
            $mailmap->{addresses}->{$wrong_email} = $real_address;
        }
    }
    close($mailmap_file);
}
## use the filenames on the command line or find the filenames in the patchfiles

my @files = ();        # file names to look up in MAINTAINERS
my @range = ();        # "file:start:length" hunks, collected for --git-blame
my @keyword_tvi = ();  # @typevalue indexes of K: entries that matched
my @file_emails = ();  # addresses found inside -f files (--file-emails)

# No arguments: read a patch from standard input.
if (!@ARGV) {
    push(@ARGV, "&STDIN");
}

foreach my $file (@ARGV) {
    if ($file ne "&STDIN") {
        ##if $file is a directory and it lacks a trailing slash, add one
        if ((-d $file)) {
            $file =~ s@([^/])$@$1/@;
        } elsif (!(-f $file)) {
            die "$P: file '${file}' not found\n";
        }
    }
    if ($from_filename || ($file ne "&STDIN" && vcs_file_exists($file))) {
        # The argument names a source file (or directory), not a patch.
        $file =~ s/^\Q${cur_path}\E//;	#strip any absolute path
        $file =~ s/^\Q${lk_path}\E//;	#or the path to the lk tree
        push(@files, $file);
        if ($file ne "MAINTAINERS" && -f $file && ($keywords || $file_emails)) {
            open(my $f, '<', $file)
                or die "$P: Can't open $file: $!\n";
            my $text = do { local($/) ; <$f> };
            close($f);
            if ($keywords) {
                foreach my $line (keys %keyword_hash) {
                    if ($text =~ m/$keyword_hash{$line}/x) {
                        push(@keyword_tvi, $line);
                    }
                }
            }
            if ($file_emails) {
                # \xC0-\xFF covers the accented Latin-1 letters that may
                # appear in names; written as escapes so the pattern does
                # not depend on this file's own encoding.
                my @poss_addr = $text =~ m$[A-Za-z\xC0-\xFF\"\' \,\.\+-]*\s*[\,]*\s*[\(\<\{]{0,1}[A-Za-z0-9_\.\+-]+\@[A-Za-z0-9\.-]+\.[A-Za-z0-9]+[\)\>\}]{0,1}$g;
                push(@file_emails, clean_file_emails(@poss_addr));
            }
        }
    } else {
        # The argument is a patch: pull the touched file names out of it.
        my $file_cnt = @files;
        my $lastfile;

        # Three-argument open so the file name is never parsed for a
        # mode; the "&STDIN" marker is handled as an explicit dup.
        my $patch;
        if ($file eq "&STDIN") {
            open($patch, '<&', \*STDIN)
                or die "$P: Can't open $file: $!\n";
        } else {
            open($patch, '<', $file)
                or die "$P: Can't open $file: $!\n";
        }

        # We can check arbitrary information before the patch
        # like the commit message, mail headers, etc...
        # This allows us to match arbitrary keywords against any part
        # of a git format-patch generated file (subject tags, etc...)

        my $patch_prefix = "";			#Parsing the intro

        while (<$patch>) {
            my $patch_line = $_;
            if (m/^ mode change [0-7]+ => [0-7]+ (\S+)\s*$/) {
                my $filename = $1;
                push(@files, $filename);
            } elsif (m/^rename (?:from|to) (\S+)\s*$/) {
                my $filename = $1;
                push(@files, $filename);
            } elsif (m/^diff --git a\/(\S+) b\/(\S+)\s*$/) {
                my $filename1 = $1;
                my $filename2 = $2;
                push(@files, $filename1);
                push(@files, $filename2);
            } elsif (m/^\+\+\+\s+(\S+)/ or m/^---\s+(\S+)/) {
                my $filename = $1;
                $filename =~ s@^[^/]*/@@;	# drop the leading a/ or b/ component
                $filename =~ s@\n@@;
                $lastfile = $filename;
                push(@files, $filename);
                $patch_prefix = "^[+-].*";	#Now parsing the actual patch
            } elsif (m/^\@\@ -(\d+),(\d+)/) {
                if ($email_git_blame) {
                    push(@range, "$lastfile:$1:$2");
                }
            } elsif ($keywords) {
                foreach my $line (keys %keyword_hash) {
                    if ($patch_line =~ m/${patch_prefix}$keyword_hash{$line}/x) {
                        push(@keyword_tvi, $line);
                    }
                }
            }
        }
        close($patch);

        if ($file_cnt == @files) {
            warn "$P: file '${file}' doesn't appear to be a patch. "
                . "Add -f to options?\n";
        }
        @files = sort_and_uniq(@files);
    }
}

@file_emails = uniq(@file_emails);
# Result accumulators.  get_maintainers() resets all of them at its start.
my %email_hash_name;
my %email_hash_address;
my @email_to = ();
my %hash_list_to;
my @list_to = ();
my @scm = ();
my @web = ();
my @subsystem = ();
my @status = ();
my %deduplicate_name_hash = ();
my %deduplicate_address_hash = ();

my @maintainers = get_maintainers();

# Print each requested category in turn, then leave with $exit.
if (@maintainers) {
    @maintainers = merge_email(@maintainers);
    output(@maintainers);
}

if ($scm) {
    @scm = uniq(@scm);
    output(@scm);
}

if ($status) {
    @status = uniq(@status);
    output(@status);
}

if ($subsystem) {
    @subsystem = uniq(@subsystem);
    output(@subsystem);
}

if ($web) {
    @web = uniq(@web);
    output(@web);
}

exit($exit);
# Check the MAINTAINERS content recorded in @self_test_info and print one
# "file:line: warning: ..." line per problem found.
#
# $self_test selects the checks; an empty string runs all of them,
# otherwise the words "sections", "patterns", "links" and "scm" enable:
#   sections - duplicate headers, sections lacking M/R/L, S or F/N entries
#   patterns - F:/X: patterns that match no file listed by the VCS
#   links    - W:/Q:/B: http(s) URLs that wget cannot reach
#   scm      - T: entries that are malformed or cannot be reached
# The links and scm checks run external wget / git commands.
sub self_test {
    my @lsfiles = ();
    my @good_links = ();
    my @bad_links = ();
    my @section_headers = ();
    my $index = 0;

    # Quote one word for /bin/sh.  MAINTAINERS values end up on a shell
    # command line below; unquoted, a URL containing '&', ';' or '$'
    # would be split or interpreted by the shell.
    my $shell_quote = sub {
        my ($word) = @_;
        $word =~ s/'/'\\''/g;
        return "'$word'";
    };

    @lsfiles = vcs_list_files($lk_path);

    for my $x (@self_test_info) {
        # From here on $index refers to the entry *after* $x.
        $index++;

        ## Section header duplication and missing section content
        if (($self_test eq "" || $self_test =~ /\bsections\b/) &&
            $x->{line} =~ /^\S[^:]/ &&
            defined $self_test_info[$index] &&
            $self_test_info[$index]->{line} =~ /^([A-Z]):\s*\S/) {
            my $has_S = 0;
            my $has_F = 0;
            my $has_ML = 0;
            my $status = "";
            if (grep(m@^\Q$x->{line}\E@, @section_headers)) {
                print("$x->{file}:$x->{linenr}: warning: duplicate section header\t$x->{line}\n");
            } else {
                push(@section_headers, $x->{line});
            }
            # Walk the "X: value" lines that make up this section.
            my $nextline = $index;
            while (defined $self_test_info[$nextline] &&
                   $self_test_info[$nextline]->{line} =~ /^([A-Z]):\s*(\S.*)/) {
                my $type = $1;
                my $value = $2;
                if ($type eq "S") {
                    $has_S = 1;
                    $status = $value;
                } elsif ($type eq "F" || $type eq "N") {
                    $has_F = 1;
                } elsif ($type eq "M" || $type eq "R" || $type eq "L") {
                    $has_ML = 1;
                }
                $nextline++;
            }
            if (!$has_ML && $status !~ /orphan|obsolete/i) {
                print("$x->{file}:$x->{linenr}: warning: section without email address\t$x->{line}\n");
            }
            if (!$has_S) {
                print("$x->{file}:$x->{linenr}: warning: section without status \t$x->{line}\n");
            }
            if (!$has_F) {
                print("$x->{file}:$x->{linenr}: warning: section without file pattern\t$x->{line}\n");
            }
        }

        next if ($x->{line} !~ /^([A-Z]):\s*(.*)/);

        my $type = $1;
        my $value = $2;

        ## Filename pattern matching
        if (($type eq "F" || $type eq "X") &&
            ($self_test eq "" || $self_test =~ /\bpatterns\b/)) {
            $value =~ s@\.@\\\.@g;       ##Convert . to \.
            $value =~ s/\*/\.\*/g;       ##Convert * to .*
            $value =~ s/\?/\./g;         ##Convert ? to .
            ##if pattern is a directory and it lacks a trailing slash, add one
            if ((-d $value)) {
                $value =~ s@([^/])$@$1/@;
            }
            if (!grep(m@^$value@, @lsfiles)) {
                print("$x->{file}:$x->{linenr}: warning: no file matches\t$x->{line}\n");
            }

        ## Link reachability
        } elsif (($type eq "W" || $type eq "Q" || $type eq "B") &&
                 $value =~ /^https?:/ &&
                 ($self_test eq "" || $self_test =~ /\blinks\b/)) {
            # Each distinct value is probed only once.
            next if (grep(m@^\Q$value\E$@, @good_links));
            my $isbad = 0;
            if (grep(m@^\Q$value\E$@, @bad_links)) {
                $isbad = 1;
            } else {
                # Same whitespace word splitting the shell would do, but
                # with every word quoted.
                my $urls = join(' ', map { $shell_quote->($_) } split(' ', $value));
                my $output = `wget --spider -q --no-check-certificate --timeout 10 --tries 1 $urls`;
                if ($? == 0) {
                    push(@good_links, $value);
                } else {
                    push(@bad_links, $value);
                    $isbad = 1;
                }
            }
            if ($isbad) {
                print("$x->{file}:$x->{linenr}: warning: possible bad link\t$x->{line}\n");
            }

        ## SCM reachability
        } elsif ($type eq "T" &&
                 ($self_test eq "" || $self_test =~ /\bscm\b/)) {
            next if (grep(m@^\Q$value\E$@, @good_links));
            my $isbad = 0;
            if (grep(m@^\Q$value\E$@, @bad_links)) {
                $isbad = 1;
            } elsif ($value !~ /^(?:git|quilt|hg)\s+\S/) {
                print("$x->{file}:$x->{linenr}: warning: malformed entry\t$x->{line}\n");
            } elsif ($value =~ /^git\s+(\S+)(\s+([^\(]+\S+))?/) {
                my $url = $1;
                my $branch = "";
                $branch = $3 if $3;
                my $quoted_url = $shell_quote->($url);
                my $quoted_branch =
                    join(' ', map { $shell_quote->($_) } split(' ', $branch));
                my $output = `git ls-remote --exit-code -h $quoted_url $quoted_branch > /dev/null 2>&1`;
                if ($? == 0) {
                    push(@good_links, $value);
                } else {
                    push(@bad_links, $value);
                    $isbad = 1;
                }
            } elsif ($value =~ /^(?:quilt|hg)\s+(https?:\S+)/) {
                my $url = $shell_quote->($1);
                my $output = `wget --spider -q --no-check-certificate --timeout 10 --tries 1 $url`;
                if ($? == 0) {
                    push(@good_links, $value);
                } else {
                    push(@bad_links, $value);
                    $isbad = 1;
                }
            }
            if ($isbad) {
                print("$x->{file}:$x->{linenr}: warning: possible bad link\t$x->{line}\n");
            }
        }
    }
}
# Return 1 if $address is exactly equal to an entry of @ignore_emails,
# 0 otherwise.
sub ignore_email_address {
    my ($address) = @_;

    foreach my $ignore (@ignore_emails) {
        return 1 if ($ignore eq $address);
    }

    return 0;
}
# Return 1 if any @typevalue entry with index in [$start, $end) is an S:
# line whose value contains "maintain" or "support" (case-insensitive),
# 0 otherwise.
sub range_is_maintained {
    my ($start, $end) = @_;

    for (my $i = $start; $i < $end; $i++) {
        my $line = $typevalue[$i];
        if ($line =~ m/^([A-Z]):\s*(.*)/) {
            my $type = $1;
            my $value = $2;
            if ($type eq 'S') {
                if ($value =~ /(maintain|support)/i) {
                    return 1;
                }
            }
        }
    }
    return 0;
}
# Return 1 if any @typevalue entry with index in [$start, $end) is an M:
# line, 0 otherwise.
sub range_has_maintainer {
    my ($start, $end) = @_;

    for (my $i = $start; $i < $end; $i++) {
        my $line = $typevalue[$i];
        if ($line =~ m/^([A-Z]):\s*(.*)/) {
            my $type = $1;
            my $value = $2;
            if ($type eq 'M') {
                return 1;
            }
        }
    }
    return 0;
}
# Work out who should receive mail for the files in @files.
#
# Resets all result accumulators, matches every file against the F:, X:
# and N: patterns of each MAINTAINERS section, adds the categories of the
# matching sections (and of K: keyword hits), optionally consults VCS
# history, and applies the chief-penguin and --file-emails handling.
# With --sections the matching sections are printed directly.
#
# Returns the list of entries from @email_to followed by @list_to
# (as selected by $email / $email_list), after the interactive menu if
# --interactive is set.
sub get_maintainers {
    %email_hash_name = ();
    %email_hash_address = ();
    %commit_author_hash = ();
    %commit_signer_hash = ();
    @email_to = ();
    %hash_list_to = ();
    @list_to = ();
    @scm = ();
    @web = ();
    @subsystem = ();
    @status = ();
    %deduplicate_name_hash = ();
    %deduplicate_address_hash = ();
    if ($email_git_all_signature_types) {
        $signature_pattern = "(.+?)[Bb][Yy]:";
    } else {
        $signature_pattern = "\(" . join("|", @signature_tags) . "\)";
    }

    # Find responsible parties

    my %exact_pattern_match_hash = ();

    foreach my $file (@files) {

        # section index => pattern depth of the match; used to order output
        my %hash;
        my $tvi = find_first_section();
        while ($tvi < @typevalue) {
            my $start = find_starting_index($tvi);
            my $end = find_ending_index($tvi);
            my $exclude = 0;
            my $i;

            #Do not match excluded file patterns

            for ($i = $start; $i < $end; $i++) {
                my $line = $typevalue[$i];
                if ($line =~ m/^([A-Z]):\s*(.*)/) {
                    my $type = $1;
                    my $value = $2;
                    if ($type eq 'X') {
                        if (file_match_pattern($file, $value)) {
                            $exclude = 1;
                            last;
                        }
                    }
                }
            }

            if (!$exclude) {
                for ($i = $start; $i < $end; $i++) {
                    my $line = $typevalue[$i];
                    if ($line =~ m/^([A-Z]):\s*(.*)/) {
                        my $type = $1;
                        my $value = $2;
                        if ($type eq 'F') {
                            if (file_match_pattern($file, $value)) {
                                # Depth = number of '/' in pattern and file.
                                my $value_pd = ($value =~ tr@/@@);
                                my $file_pd = ($file  =~ tr@/@@);
                                $value_pd++ if (substr($value,-1,1) ne "/");
                                $value_pd = -1 if ($value =~ /^\.\*/);
                                if ($value_pd >= $file_pd &&
                                    range_is_maintained($start, $end) &&
                                    range_has_maintainer($start, $end)) {
                                    $exact_pattern_match_hash{$file} = 1;
                                }
                                if ($pattern_depth == 0 ||
                                    (($file_pd - $value_pd) < $pattern_depth)) {
                                    $hash{$tvi} = $value_pd;
                                }
                            }
                        } elsif ($type eq 'N') {
                            if ($file =~ m/$value/x) {
                                $hash{$tvi} = 0;
                            }
                        }
                    }
                }
            }
            $tvi = $end + 1;
        }

        # Deepest (most specific) pattern matches first.
        foreach my $line (sort {$hash{$b} <=> $hash{$a}} keys %hash) {
            add_categories($line);
            if ($sections) {
                my $i;
                my $start = find_starting_index($line);
                my $end = find_ending_index($line);
                for ($i = $start; $i < $end; $i++) {
                    my $line = $typevalue[$i];
                    if ($line =~ /^[FX]:/) {		##Restore file patterns
                        $line =~ s/([^\\])\.([^\*])/$1\?$2/g;
                        $line =~ s/([^\\])\.$/$1\?/g;	##Convert . back to ?
                        $line =~ s/\\\./\./g;       	##Convert \. to .
                        $line =~ s/\.\*/\*/g;       	##Convert .* to *
                    }
                    my $count = $line =~ s/^([A-Z]):/$1:\t/g;
                    if ($letters eq "" || (!$count || $letters =~ /$1/i)) {
                        print("$line\n");
                    }
                }
                print("\n");
            }
        }
    }

    if ($keywords) {
        @keyword_tvi = sort_and_uniq(@keyword_tvi);
        foreach my $line (@keyword_tvi) {
            add_categories($line);
        }
    }

    foreach my $email (@email_to, @list_to) {
        $email->[0] = deduplicate_email($email->[0]);
    }

    foreach my $file (@files) {
        if ($email &&
            ($email_git || ($email_git_fallback &&
                            !$exact_pattern_match_hash{$file}))) {
            vcs_file_signoffs($file);
        }
        if ($email && $email_git_blame) {
            vcs_file_blame($file);
        }
    }

    if ($email) {
        foreach my $chief (@penguin_chief) {
            if ($chief =~ m/^(.*):(.*)/) {
                my $email_address;

                $email_address = format_email($1, $2, $email_usename);
                if ($email_git_penguin_chiefs) {
                    push(@email_to, [$email_address, 'chief penguin']);
                } else {
                    # \Q..\E: the address is literal text, not a pattern;
                    # unquoted, '.' would match any character.
                    @email_to = grep($_->[0] !~ /\Q${email_address}\E/, @email_to);
                }
            }
        }

        foreach my $email (@file_emails) {
            my ($name, $address) = parse_email($email);

            my $tmp_email = format_email($name, $address, $email_usename);
            push_email_address($tmp_email, '');
            add_role($tmp_email, 'in file');
        }
    }

    my @to = ();
    if ($email || $email_list) {
        if ($email) {
            @to = (@to, @email_to);
        }
        if ($email_list) {
            @to = (@to, @list_to);
        }
    }

    if ($interactive) {
        @to = interactive_get_maintainers(\@to);
    }

    return @to;
}
# Decide whether $file is covered by $pattern (a regex built from a
# MAINTAINERS F:/X: glob; it is anchored at the start of $file here).
#
# A pattern ending in "/" covers everything below that directory.  Any
# other pattern only covers files at the same directory depth, i.e. the
# file and the pattern must contain the same number of "/" characters.
# Returns 1 on a match, 0 otherwise.
sub file_match_pattern {
    my ($file, $pattern) = @_;
    if (substr($pattern, -1) eq "/") {
        if ($file =~ m@^$pattern@) {
            return 1;
        }
    } else {
        if ($file =~ m@^$pattern@) {
            my $s1 = ($file =~ tr@/@@);
            my $s2 = ($pattern =~ tr@/@@);
            if ($s1 == $s2) {
                return 1;
            }
        }
    }
    return 0;
}
# Print the help text, including the current default values of the
# options, to standard output.
sub usage {
    print <<EOT;
usage: $P [options] patchfile
       $P [options] -f file|directory
version: $V

MAINTAINER field selection options:
  --email => print email address(es) if any
    --git => include recent git \*-by: signers
    --git-all-signature-types => include signers regardless of signature type
        or use only ${signature_pattern} signers (default: $email_git_all_signature_types)
    --git-fallback => use git when no exact MAINTAINERS pattern (default: $email_git_fallback)
    --git-chief-penguins => include ${penguin_chiefs}
    --git-min-signatures => number of signatures required (default: $email_git_min_signatures)
    --git-max-maintainers => maximum maintainers to add (default: $email_git_max_maintainers)
    --git-min-percent => minimum percentage of commits required (default: $email_git_min_percent)
    --git-blame => use git blame to find modified commits for patch or file
    --git-blame-signatures => when used with --git-blame, also include all commit signers
    --git-since => git history to use (default: $email_git_since)
    --hg-since => hg history to use (default: $email_hg_since)
    --interactive => display a menu (mostly useful if used with the --git option)
    --m => include maintainer(s) if any
    --r => include reviewer(s) if any
    --n => include name 'Full Name <addr\@domain.tld>'
    --l => include list(s) if any
    --s => include subscriber only list(s) if any
    --remove-duplicates => minimize duplicate email names/addresses
    --roles => show roles (status:subsystem, git-signer, list, etc...)
    --rolestats => show roles and statistics (commits/total_commits, %)
    --file-emails => add email addresses found in -f file (default: 0 (off))
  --scm => print SCM tree(s) if any
  --status => print status if any
  --subsystem => print subsystem name if any
  --web => print website(s) if any

Output type options:
  --separator [, ] => separator for multiple entries on 1 line
    using --separator also sets --nomultiline if --separator is not [, ]
  --multiline => print 1 entry per line

Other options:
  --pattern-depth => Number of pattern directory traversals (default: 0 (all))
  --keywords => scan patch for keywords (default: $keywords)
  --sections => print all of the subsystem sections with pattern matches
  --letters => print all matching 'letter' types from all matching sections
  --mailmap => use .mailmap file (default: $email_use_mailmap)
  --no-tree => run without a kernel tree
  --self-test => show potential issues with MAINTAINERS file content
  --version => show version
  --help => show this help information

Default options:
  [--email --tree --nogit --git-fallback --m --r --n --l --multiline
   --pattern-depth=0 --remove-duplicates --rolestats]

Notes:
  Using "-f directory" may give unexpected results:
      Used with "--git", git signators for _all_ files in and below
          directory are examined as git recurses directories.
          Any specified X: (exclude) pattern matches are _not_ ignored.
      Used with "--nogit", directory is used as a pattern match,
          no individual file within the directory or subdirectory
          is matched.
      Used with "--git-blame", does not iterate all files in directory
  Using "--git-blame" is slow and may add old committers and authors
      that are no longer active maintainers to the output.
  Using "--roles" or "--rolestats" with git send-email --cc-cmd or any
      other automated tools that expect only ["name"] <email address>
      may not work because of additional output after <email address>.
  Using "--rolestats" and "--git-blame" shows the #/total=% commits,
      not the percentage of the entire file authored. # of commits is
      not a good measure of amount of code authored. 1 major commit may
      contain a thousand lines, 5 trivial commits may modify a single line.
  If git is not installed, but mercurial (hg) is installed and an .hg
      repository exists, the following options apply to mercurial:
          --git,
          --git-min-signatures, --git-max-maintainers, --git-min-percent, and
          --git-blame
      Use --hg-since not --git-since to control date selection
  File ".get_maintainer.conf", if it exists in the linux kernel source root
      directory, can change whatever get_maintainer defaults are desired.
      Entries in this file can be any command line argument.
      This file is prepended to any additional command line arguments.
      Multiple lines and # comments are allowed.
  Most options have both positive and negative forms.
      The negative forms for --<foo> are --no<foo> and --no-<foo>.

EOT
}
# Return 1 if $lk_path looks like the root of a kernel source tree, i.e.
# it contains all of the files and directories checked below; otherwise
# return 0.  A missing trailing "/" on a non-empty path is added first.
sub top_of_kernel_tree {
    my ($lk_path) = @_;

    if ($lk_path ne "" && substr($lk_path,length($lk_path)-1,1) ne "/") {
        $lk_path .= "/";
    }
    if (   (-f "${lk_path}COPYING")
        && (-f "${lk_path}CREDITS")
        && (-f "${lk_path}Kbuild")
        && (-e "${lk_path}MAINTAINERS")
        && (-f "${lk_path}Makefile")
        && (-f "${lk_path}README")
        && (-d "${lk_path}Documentation")
        && (-d "${lk_path}arch")
        && (-d "${lk_path}include")
        && (-d "${lk_path}drivers")
        && (-d "${lk_path}fs")
        && (-d "${lk_path}init")
        && (-d "${lk_path}ipc")
        && (-d "${lk_path}kernel")
        && (-d "${lk_path}lib")
        && (-d "${lk_path}scripts")) {
        return 1;
    }
    return 0;
}
# Split a formatted address into (name, address).
#
# Accepted forms are "Name <addr>", "<addr>" and a bare "addr"; anything
# else yields two empty strings.  Surrounding whitespace is trimmed and
# one leading / trailing double quote is removed from the name.  A name
# containing characters other than word characters, space and '-' is
# returned wrapped in double quotes, with embedded quotes escaped.
sub parse_email {
    my ($formatted_email) = @_;

    my $name = "";
    my $address = "";

    if ($formatted_email =~ /^([^<]+)<(.+\@.*)>.*$/) {
        $name = $1;
        $address = $2;
    } elsif ($formatted_email =~ /^\s*<(.+\@\S*)>.*$/) {
        $address = $1;
    } elsif ($formatted_email =~ /^(.+\@\S*).*$/) {
        $address = $1;
    }

    $name =~ s/^\s+|\s+$//g;
    $name =~ s/^\"|\"$//g;
    $address =~ s/^\s+|\s+$//g;

    if ($name =~ /[^\w \-]/i) {  	 ##has "must quote" chars
        $name =~ s/(?<!\\)"/\\"/g; ##escape quotes
        $name = "\"$name\"";
    }

    return ($name, $address);
}
# Build the printable form of an address.
#
# $name and $address are trimmed; the name is quoted the same way as in
# parse_email().  Returns "name <address>" when $usename is true and the
# name is non-empty, otherwise just the address.
sub format_email {
    my ($name, $address, $usename) = @_;

    my $formatted_email;

    $name =~ s/^\s+|\s+$//g;
    $name =~ s/^\"|\"$//g;
    $address =~ s/^\s+|\s+$//g;

    if ($name =~ /[^\w \-]/i) {  	 ##has "must quote" chars
        $name =~ s/(?<!\\)"/\\"/g; ##escape quotes
        $name = "\"$name\"";
    }

    if ($usename) {
        if ("$name" eq "") {
            $formatted_email = "$address";
        } else {
            $formatted_email = "$name <$address>";
        }
    } else {
        $formatted_email = $address;
    }

    return $formatted_email;
}
# Find the first "X: value" entry line in @typevalue.
# Returns its index, or the number of elements in @typevalue when no line
# has that shape.
sub find_first_section {
    my $index = 0;

    $index++
        while ($index < @typevalue
               && $typevalue[$index] !~ m/^([A-Z]):\s*(.*)/);

    return $index;
}
# Walk backwards from $index over consecutive "X: value" lines of
# @typevalue.
# Returns the index of the first line reached that does not have that shape
# (the line preceding the run), or 0 when the run extends to the top.
sub find_starting_index {
    my ($index) = @_;

    $index--
        while ($index > 0
               && $typevalue[$index] =~ m/^([A-Z]):\s*(.*)/);

    return $index;
}
# Walk forwards from $index over consecutive "X: value" lines of
# @typevalue.
# Returns the index just past the run: the first line that does not have
# that shape, or the number of elements when the run reaches the end.
sub find_ending_index {
    my ($index) = @_;

    $index++
        while ($index < @typevalue
               && $typevalue[$index] =~ m/^([A-Z]):\s*(.*)/);

    return $index;
}
# Return the heading line of the section that contains entry $index.
#
# When $output_section_maxlen is non-zero and the heading is longer than
# that, it is cut to ($output_section_maxlen - 3) characters, trailing
# whitespace is removed and "..." is appended.
sub get_subsystem_name {
    my ($index) = @_;

    my $subsystem = $typevalue[find_starting_index($index)];

    return $subsystem
        if (!$output_section_maxlen
            || length($subsystem) <= $output_section_maxlen);

    $subsystem = substr($subsystem, 0, $output_section_maxlen - 3);
    $subsystem =~ s/\s*$//;
    return $subsystem . "...";
}
# Describe the role of a maintainer entry as "<role>:<subsystem>".
#
# The role comes from the last "S:" line of the section containing $index
# ("unknown" when there is none), lower-cased and, for the known status
# words, turned into a person-style title.  The subsystem part is whatever
# get_subsystem_name() returns for $index.
sub get_maintainer_role {
    my ($index) = @_;

    my $start = find_starting_index($index);
    my $end = find_ending_index($index);

    my $role = "unknown";
    my $subsystem = get_subsystem_name($index);

    foreach my $pos ($start + 1 .. $end - 1) {
        next unless ($typevalue[$pos] =~ m/^([A-Z]):\s*(.*)/);
        $role = $2 if ($1 eq "S");
    }

    # Status word (lower case) => title shown to the user.
    my %title_for = (
        "supported"                 => "supporter",
        "maintained"                => "maintainer",
        "odd fixes"                 => "odd fixer",
        "orphan"                    => "orphan minder",
        "obsolete"                  => "obsolete minder",
        "buried alive in reporters" => "chief penguin",
    );

    $role = lc($role);
    $role = $title_for{$role} if (exists $title_for{$role});

    return $role . ":" . $subsystem;
}
# Return the subsystem name used to label a mailing-list entry.
# The catch-all section "THE REST" is reported as the empty string.
sub get_list_role {
    my ($index) = @_;

    my $subsystem = get_subsystem_name($index);

    return ($subsystem eq "THE REST") ? "" : $subsystem;
}
# Collect everything the section containing entry $index contributes.
#
# The section heading is appended to @subsystem, then every "X: value" line
# of the section is dispatched on its type letter:
#   L  mailing list - added to @list_to once per lower-cased address,
#      labelled "subscriber list", "moderated list" or "open list" and
#      gated by $email_subscriber_list / $email_list
#   M  maintainer   - pushed with its role when $email_maintainer is set
#   R  reviewer     - pushed as "reviewer:<subsystem>" when $email_reviewer
#      is set
#   T  appended to @scm
#   W  appended to @web
#   S  appended to @status
# For M and R lines that carry no name, the name is taken from an
# immediately preceding "P:" line when there is one.
sub add_categories {
    my ($index) = @_;

    my $start = find_starting_index($index);
    my $end = find_ending_index($index);

    push(@subsystem, $typevalue[$start]);

    foreach my $pos ($start + 1 .. $end - 1) {
        next unless ($typevalue[$pos] =~ m/^([A-Z]):\s*(.*)/);
        my ($ptype, $pvalue) = ($1, $2);

        if ($ptype eq "L") {
            my $list_address = $pvalue;
            my $list_additional = "";
            my $list_role = get_list_role($pos);
            $list_role = ":" . $list_role if ($list_role ne "");

            # "address extra words" => address plus trailing annotation.
            if ($list_address =~ m/([^\s]+)\s+(.*)$/) {
                ($list_address, $list_additional) = ($1, $2);
            }

            my $subscribers_only =
                ($list_additional =~ m/subscribers-only/);
            my $wanted = $subscribers_only
                ? $email_subscriber_list
                : $email_list;
            next if (!$wanted || $hash_list_to{lc($list_address)});

            $hash_list_to{lc($list_address)} = 1;
            my $kind = $subscribers_only                      ? "subscriber list"
                     : ($list_additional =~ m/moderated/)     ? "moderated list"
                     :                                          "open list";
            push(@list_to, [$list_address, "${kind}${list_role}"]);
        } elsif ($ptype eq "M" || $ptype eq "R") {
            my ($name, $address) = parse_email($pvalue);

            # Nameless entry: borrow the name from a preceding "P:" line.
            if ($name eq "" && $pos > 0
                && $typevalue[$pos - 1] =~ m/^([A-Z]):\s*(.*)/) {
                my ($prev_type, $prev_value) = ($1, $2);
                if ($prev_type eq "P") {
                    $name = $prev_value;
                    $pvalue = format_email($name, $address, $email_usename);
                }
            }

            if ($ptype eq "M") {
                if ($email_maintainer) {
                    my $role = get_maintainer_role($pos);
                    push_email_addresses($pvalue, $role);
                }
            } elsif ($email_reviewer) {
                my $subsystem = get_subsystem_name($pos);
                push_email_addresses($pvalue, "reviewer:$subsystem");
            }
        } elsif ($ptype eq "T") {
            push(@scm, $pvalue);
        } elsif ($ptype eq "W") {
            push(@web, $pvalue);
        } elsif ($ptype eq "S") {
            push(@status, $pvalue);
        }
    }
}
# Tell whether a name/address pair is already recorded.
#
# Returns 1 when both parts are empty, when the non-empty name is a key of
# %email_hash_name, or when the non-empty address is a key of
# %email_hash_address (both looked up lower-cased); 0 otherwise.
sub email_inuse {
    my ($name, $address) = @_;

    my $have_name = ($name ne "");
    my $have_address = ($address ne "");

    return 1 if (!$have_name && !$have_address);
    return 1 if ($have_name && exists($email_hash_name{lc($name)}));
    return 1 if ($have_address && exists($email_hash_address{lc($address)}));

    return 0;
}
# Append one address, with its role, to @email_to.
#
# $line: formatted email text, parsed with parse_email()
# $role: role string stored next to the address
# With $email_remove_duplicates set, an entry whose name or address is
# already recorded is silently skipped and new entries are recorded in
# %email_hash_name / %email_hash_address.
# Returns 0 when $line holds no address, 1 otherwise (also when skipped).
sub push_email_address {
    my ($line, $role) = @_;

    my ($name, $address) = parse_email($line);
    return 0 if ($address eq "");

    if ($email_remove_duplicates) {
        if (!email_inuse($name, $address)) {
            push(@email_to,
                 [format_email($name, $address, $email_usename), $role]);
            $email_hash_name{lc($name)}++ if ($name ne "");
            $email_hash_address{lc($address)}++;
        }
    } else {
        push(@email_to,
             [format_email($name, $address, $email_usename), $role]);
    }

    return 1;
}
# Add one address, or a list of addresses, under a single role.
#
# $address is first tried as a single address (rfc822_valid), then as an
# address list (rfc822_validlist).  If neither accepts it, it is handed to
# push_email_address() as-is and a warning is printed when that finds no
# address in it.
sub push_email_addresses {
    my ($address, $role) = @_;

    my @address_list = ();

    if (rfc822_valid($address)) {
        push_email_address($address, $role);
    } elsif (@address_list = rfc822_validlist($address)) {
        # The first element is dropped unused; presumably it is the entry
        # count (confirm against rfc822_validlist).
        shift(@address_list);
        while (my $entry = shift(@address_list)) {
            push_email_address($entry, $role);
        }
    } elsif (!push_email_address($address, $role)) {
        warn("Invalid MAINTAINERS address: '" . $address . "'\n");
    }
}
# Attach a role to every matching entry of @email_to.
#
# $line: formatted email text identifying the person
# $role: role text to attach; added at most once per entry
#
# With $email_remove_duplicates set, an entry matches when its name or its
# address equals the parsed name/address of $line; otherwise the formatted
# email must equal the entry text exactly.  A role the entry already
# contains is not added again.  Roles are joined with ",".
sub add_role {
    my ($line, $role) = @_;

    my ($name, $address) = parse_email($line);
    my $email = format_email($name, $address, $email_usename);

    foreach my $entry (@email_to) {
        my $same_person;
        if ($email_remove_duplicates) {
            my ($entry_name, $entry_address) = parse_email($entry->[0]);
            $same_person = ($name eq $entry_name
                            || $address eq $entry_address);
        } else {
            $same_person = ($email eq $entry->[0]);
        }
        next if (!$same_person);

        # \Q...\E: the role is literal text, not a pattern.  Without the
        # quoting a role containing regex metacharacters would mis-match or
        # abort with a pattern compile error.  The empty role is tested
        # separately because an empty pattern does not mean "match nothing".
        next if ($role ne "" && $entry->[1] =~ m/\Q$role\E/);

        $entry->[1] = ($entry->[1] eq "")
            ? "$role"
            : "$entry->[1],$role";
    }
}
# Find $bin in the directories listed in $ENV{PATH}.
#
# Returns "<dir>/<bin>" for the first directory where that path exists, or
# the empty string when it is found nowhere.  An unset PATH is treated as
# an empty search list instead of being passed to split() undefined.
sub which {
    my ($bin) = @_;

    my $search_path = defined($ENV{PATH}) ? $ENV{PATH} : "";

    foreach my $path (split(/:/, $search_path)) {
        return "$path/$bin" if (-e "$path/$bin");
    }

    return "";
}
# Find the configuration file $conf.
#
# Looks in ".", then $ENV{HOME}, then ".scripts", and returns
# "<dir>/<conf>" for the first place where it exists, or the empty string.
# An unset or empty HOME is skipped: interpolating it would produce an
# empty directory component and make the search probe "/<conf>" in the
# filesystem root.
sub which_conf {
    my ($conf) = @_;

    my @search_dirs = (".");
    push(@search_dirs, $ENV{HOME})
        if (defined($ENV{HOME}) && $ENV{HOME} ne "");
    push(@search_dirs, ".scripts");

    foreach my $path (@search_dirs) {
        return "$path/$conf" if (-e "$path/$conf");
    }

    return "";
}
# Map one email line through the $mailmap tables.
#
# The lookup key is the fully formatted "name <address>" form when either
# $mailmap->{names} or $mailmap->{addresses} has an entry for it, and the
# bare address otherwise.  Name and address are replaced independently,
# each only when its table has the key.
# Returns the result formatted as "name <address>" (or just the address
# when the name is empty).
sub mailmap_email {
    my ($line) = @_;

    my ($name, $address) = parse_email($line);
    my $email = format_email($name, $address, 1);

    my $key = (exists $mailmap->{names}->{$email} ||
               exists $mailmap->{addresses}->{$email})
        ? $email
        : $address;

    my $real_name = exists $mailmap->{names}->{$key}
        ? $mailmap->{names}->{$key}
        : $name;
    my $real_address = exists $mailmap->{addresses}->{$key}
        ? $mailmap->{addresses}->{$key}
        : $address;

    return format_email($real_name, $real_address, 1);
}
# Run every address through mailmap_email() and return the mapped list.
# merge_by_realname() is additionally invoked on the mapped list when
# $email_use_mailmap is set.
sub mailmap {
    my (@addresses) = @_;

    my @mapped_emails = map { mailmap_email($_) } @addresses;

    merge_by_realname(@mapped_emails) if ($email_use_mailmap);

    return @mapped_emails;
}
# Give every entry that shares a real name the same address.
#
# The first address seen for a name wins; later entries with that name are
# rewritten to "name <first address>".  Entries without a name are left
# untouched, since an empty name says nothing about who the sender is.
#
# The entries are rewritten in place: the loop walks @_ itself, whose
# elements alias the caller's values.  Assigning to a private copy of @_
# would discard every rewrite and leave the caller's list unchanged.
# The merged list is also returned for callers that prefer a return value.
sub merge_by_realname {
    my %address_map;

    foreach my $email (@_) {
        my ($name, $address) = parse_email($email);
        next if ($name eq "");

        if (exists $address_map{$name}) {
            $email = format_email($name, $address_map{$name}, 1);
        } else {
            $address_map{$name} = $address;
        }
    }

    return @_;
}
# Run a shell command and return its output as a list of lines.
# Leading whitespace is removed from every line before splitting.
sub git_execute_cmd {
    my ($cmd) = @_;

    my $captured = `$cmd`;
    $captured =~ s/^\s*//gm;

    my @lines = split("\n", $captured);
    return @lines;
}
# Run a shell command and return its output as a list of lines, with each
# line's content left exactly as the command printed it.
sub hg_execute_cmd {
    my ($cmd) = @_;

    my $captured = `$cmd`;

    my @lines = split("\n", $captured);
    return @lines;
}
# Split "Type: Person <address>" lines into their two halves.
#
# Returns two array references of equal length: the text before the last
# ":" of each line (the signature type) and the text after it, the latter
# passed through deduplicate_email() so badly written signatures come out
# in a uniform format.
sub extract_formatted_signatures {
    my (@signature_lines) = @_;

    my @types = ();
    my @signers = ();

    foreach my $line (@signature_lines) {
        (my $type = $line) =~ s/\s*(.*):.*/$1/;

        # cut -f2- -d":"
        (my $signer = $line) =~ s/\s*.*:\s*(.+)\s*/$1/;

        push(@types, $type);
        push(@signers, deduplicate_email($signer));
    }

    return (\@types, \@signers);
}
# Run a VCS log command and pick authors, signers and stat lines out of it.
#
# $cmd:  command line handed to the active VCS "execute_cmd" handler
# $file: file being examined.  It must keep this name: the "stat_pattern"
#        template is expanded with a string eval that resolves "$name"
#        references against the variables in scope here.
#
# Returns ($commits, \@signers, \@authors, \@stats).  When the output has
# no signature lines the first element is 0 and the raw (unformatted)
# matches are returned instead.
sub vcs_find_signers {
    my ($cmd, $file) = @_;
    my $commits;

    my @lines = $VCS_cmds{"execute_cmd"}->($cmd);

    my $pattern = $VCS_cmds{"commit_pattern"};
    my $author_pattern = $VCS_cmds{"author_pattern"};
    my $stat_pattern = $VCS_cmds{"stat_pattern"};

    $stat_pattern =~ s/(\$\w+)/$1/eeg;    #interpolate $stat_pattern

    $commits = grep(/$pattern/, @lines);    # of commits

    my @authors = grep(/$author_pattern/, @lines);
    my @signatures = grep(/^[ \t]*${signature_pattern}.*\@.*$/, @lines);
    my @stats = grep(/$stat_pattern/, @lines);

    return (0, \@signatures, \@authors, \@stats) if !@signatures;

    if ($interactive) {
        save_commits_by_author(@lines);
        save_commits_by_signer(@lines);
    }

    @signatures = grep(!/${penguin_chiefs}/i, @signatures)
        if (!$email_git_penguin_chiefs);

    # Only the formatted person halves are needed; authors are processed
    # before signers, as deduplicate_email() remembers what it has seen.
    my (undef, $authors_ref) = extract_formatted_signatures(@authors);
    my (undef, $signers_ref) = extract_formatted_signatures(@signatures);

    return ($commits, $signers_ref, $authors_ref, \@stats);
}
# Run a VCS command and return the authors found in its output, each
# formatted as "name <address>".
#
# Lines matching $penguin_chiefs are dropped first unless
# $email_git_penguin_chiefs is set.  Returns an empty list when no lines
# remain.  In interactive mode the remaining lines are also recorded per
# author and per signer.
sub vcs_find_author {
    my ($cmd) = @_;

    my @lines = $VCS_cmds{"execute_cmd"}->($cmd);

    @lines = grep(!/${penguin_chiefs}/i, @lines)
        if (!$email_git_penguin_chiefs);

    return @lines if !@lines;

    my @authors = ();
    foreach my $line (@lines) {
        next unless ($line =~ m/$VCS_cmds{"author_pattern"}/);
        my $author = $1;
        my ($name, $address) = parse_email($author);
        push(@authors, format_email($name, $address, 1));
    }

    if ($interactive) {
        save_commits_by_author(@lines);
        save_commits_by_signer(@lines);
    }

    return @authors;
}
# Run a blame command and return the first capture of
# $VCS_cmds{"blame_commit_pattern"} from every output line that matches
# it, in output order.
sub vcs_save_commits {
    my ($cmd) = @_;

    my @lines = $VCS_cmds{"execute_cmd"}->($cmd);

    my @commits = map {
        ($_ =~ m/$VCS_cmds{"blame_commit_pattern"}/) ? ($1) : ()
    } @lines;

    return @commits;
}
# Return the commit ids that blame reports for $file.
#
# Three cases:
#   - @range is set and the VCS has no per-range blame command: blame the
#     whole file once and pick the entries for each "file:start:length"
#     range that names $file;
#   - @range is set and a per-range command exists: run it once per
#     matching range;
#   - otherwise: blame the whole file.
# A leading "^" is stripped from every returned id.  Returns an empty list
# when $file is not a plain file.
#
# The locals $file, $diff_start and $diff_length must keep these names: the
# command templates are expanded with a string eval that resolves "$name"
# references against the variables in scope here.
sub vcs_blame {
    my ($file) = @_;
    my $cmd;
    my @commits = ();

    return @commits if (!(-f $file));

    if (@range && $VCS_cmds{"blame_range_cmd"} eq "") {
        my @all_commits = ();

        $cmd = $VCS_cmds{"blame_file_cmd"};
        $cmd =~ s/(\$\w+)/$1/eeg;    #interpolate $cmd
        @all_commits = vcs_save_commits($cmd);

        foreach my $file_range_diff (@range) {
            next if (!($file_range_diff =~ m/(.+):(.+):(.+)/));
            my $diff_file = $1;
            my $diff_start = $2;
            my $diff_length = $3;
            next if ("$file" ne "$diff_file");
            # NOTE(review): $diff_start is used directly as an index into
            # the 0-based blame list; if @range stores 1-based line numbers
            # this selects the line after the intended one - confirm where
            # @range is filled.
            for (my $i = $diff_start; $i < $diff_start + $diff_length; $i++) {
                # A range may extend past the blame output (for instance
                # when the diff and the working file disagree); stop rather
                # than collect undefined commit ids.
                last if ($i > $#all_commits);
                push(@commits, $all_commits[$i]);
            }
        }
    } elsif (@range) {
        foreach my $file_range_diff (@range) {
            next if (!($file_range_diff =~ m/(.+):(.+):(.+)/));
            my $diff_file = $1;
            my $diff_start = $2;
            my $diff_length = $3;
            next if ("$file" ne "$diff_file");
            $cmd = $VCS_cmds{"blame_range_cmd"};
            $cmd =~ s/(\$\w+)/$1/eeg;    #interpolate $cmd
            push(@commits, vcs_save_commits($cmd));
        }
    } else {
        $cmd = $VCS_cmds{"blame_file_cmd"};
        $cmd =~ s/(\$\w+)/$1/eeg;    #interpolate $cmd
        @commits = vcs_save_commits($cmd);
    }

    foreach my $commit (@commits) {
        $commit =~ s/^\^//g;
    }

    return @commits;
}
# Set once the "no VCS" advice has been printed, so it appears only once.
my $printed_novcs = 0;

# Select the version control system to use.
#
# Each candidate command table is copied into %VCS_cmds in turn and its
# "available" expression is evaluated; the first one that evaluates true
# stays selected.
# Returns 1 for git, 2 for hg.  When neither is available %VCS_cmds is
# emptied, advice is printed to STDERR (first time only) and 0 is returned.
sub vcs_exists {
    my @candidates = (
        [1, \%VCS_cmds_git],
        [2, \%VCS_cmds_hg],
    );

    foreach my $candidate (@candidates) {
        my ($vcs_id, $cmds_ref) = @{$candidate};
        %VCS_cmds = %{$cmds_ref};
        return $vcs_id if eval $VCS_cmds{"available"};
    }

    %VCS_cmds = ();
    unless ($printed_novcs) {
        warn("$P: No supported VCS found. Add --nogit to options?\n");
        warn("Using a git repository produces better results.\n");
        warn("Try Linus Torvalds' latest git repository using:\n");
        warn("git clone git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git\n");
        $printed_novcs = 1;
    }
    return 0;
}
# True when the recorded VCS ($vcs_used) is git (value 1).
# vcs_exists() is called first for its side effect of reloading %VCS_cmds;
# its return value is not used here.
sub vcs_is_git {
    vcs_exists();

    my $is_git = ($vcs_used == 1);
    return $is_git;
}
# True when the recorded VCS ($vcs_used) is hg (value 2).
sub vcs_is_hg {
    my $is_hg = ($vcs_used == 2);
    return $is_hg;
}
# Interactive selection menu for the computed recipient list.
#
# $list_ref: reference to an array of [email, role] pairs.
# The menu is drawn on STDERR and commands are read from STDIN until the
# user approves with "y".  Returns the pairs that are still selected.
# Commands that change how the list is computed set $rerun, which
# re-enters get_maintainers via "goto &get_maintainers".
1727 sub interactive_get_maintainers {
1728 my ($list_ref) = @_;
1729 my @list = @$list_ref;
1731 vcs_exists();
# Per-entry state, keyed by position in @list: every entry starts selected,
# with its author and signer commit details hidden.  $maintained records
# whether any role starts with "maintainer" or "supporter".
1733 my %selected;
1734 my %authored;
1735 my %signed;
1736 my $count = 0;
1737 my $maintained = 0;
1738 foreach my $entry (@list) {
1739 $maintained = 1 if ($entry->[1] =~ /^(maintainer|supporter)/i);
1740 $selected{$count} = 1;
1741 $authored{$count} = 0;
1742 $signed{$count} = 0;
1743 $count++;
1746 #menu loop
1747 my $done = 0;
1748 my $print_options = 0;
1749 my $redraw = 1;
1750 while (!$done) {
1751 $count = 0;
# Redraw: a header line, then one row per entry with its selection mark,
# 1-based number, email and role.  The commit counts come from
# %commit_author_hash and %commit_signer_hash and are printed only when
# non-zero.
1752 if ($redraw) {
1753 printf STDERR "\n%1s %2s %-65s",
1754 "*", "#", "email/list and role:stats";
1755 if ($email_git ||
1756 ($email_git_fallback && !$maintained) ||
1757 $email_git_blame) {
1758 print STDERR "auth sign";
1760 print STDERR "\n";
1761 foreach my $entry (@list) {
1762 my $email = $entry->[0];
1763 my $role = $entry->[1];
1764 my $sel = "";
1765 $sel = "*" if ($selected{$count});
1766 my $commit_author = $commit_author_hash{$email};
1767 my $commit_signer = $commit_signer_hash{$email};
1768 my $authored = 0;
1769 my $signed = 0;
1770 $authored++ for (@{$commit_author});
1771 $signed++ for (@{$commit_signer});
1772 printf STDERR "%1s %2d %-65s", $sel, $count + 1, $email;
1773 printf STDERR "%4d %4d", $authored, $signed
1774 if ($authored > 0 || $signed > 0);
1775 printf STDERR "\n %s\n", $role;
1776 if ($authored{$count}) {
1777 my $commit_author = $commit_author_hash{$email};
1778 foreach my $ref (@{$commit_author}) {
1779 print STDERR " Author: @{$ref}[1]\n";
1782 if ($signed{$count}) {
1783 my $commit_signer = $commit_signer_hash{$email};
1784 foreach my $ref (@{$commit_signer}) {
1785 print STDERR " @{$ref}[2]: @{$ref}[1]\n";
1789 $count++;
# $date_ref points at the history-window setting shown in the options
# list: the git one by default, the hg one when hg is the recorded VCS.
1792 my $date_ref = \$email_git_since;
1793 $date_ref = \$email_hg_since if (vcs_is_hg());
1794 if ($print_options) {
1795 $print_options = 0;
1796 if (vcs_exists()) {
1797 print STDERR <<EOT
1799 Version Control options:
1800 g use git history [$email_git]
1801 gf use git-fallback [$email_git_fallback]
1802 b use git blame [$email_git_blame]
1803 bs use blame signatures [$email_git_blame_signatures]
1804 c# minimum commits [$email_git_min_signatures]
1805 %# min percent [$email_git_min_percent]
1806 d# history to use [$$date_ref]
1807 x# max maintainers [$email_git_max_maintainers]
1808 t all signature types [$email_git_all_signature_types]
1809 m use .mailmap [$email_use_mailmap]
1812 print STDERR <<EOT
1814 Additional options:
1815 0 toggle all
1816 tm toggle maintainers
1817 tg toggle git entries
1818 tl toggle open list entries
1819 ts toggle subscriber list entries
1820 f emails in file [$file_emails]
1821 k keywords in file [$keywords]
1822 r remove duplicates [$email_remove_duplicates]
1823 p# pattern match depth [$pattern_depth]
1826 print STDERR
1827 "\n#(toggle), A#(author), S#(signed) *(all), ^(none), O(options), Y(approve): ";
# Read one line of commands.
# NOTE(review): <STDIN> yields undef at end of input and nothing here ends
# the loop in that case - confirm how a closed STDIN should be handled.
1829 my $input = <STDIN>;
1830 chomp($input);
1832 $redraw = 1;
1833 my $rerun = 0;
# Commands are separated by commas and/or spaces.  Each one is lower-cased;
# $sel is its first character, $str the remainder, and $val the remainder
# as a number when it consists of digits only (0 otherwise).
1834 my @wish = split(/[, ]+/, $input);
1835 foreach my $nr (@wish) {
1836 $nr = lc($nr);
1837 my $sel = substr($nr, 0, 1);
1838 my $str = substr($nr, 1);
1839 my $val = 0;
1840 $val = $1 if $str =~ /^(\d+)$/;
# "y" approves: leaves interactive mode and switches role output off.
1842 if ($sel eq "y") {
1843 $interactive = 0;
1844 $done = 1;
1845 $output_rolestats = 0;
1846 $output_roles = 0;
1847 last;
1848 } elsif ($nr =~ /^\d+$/ && $nr > 0 && $nr <= $count) {
1849 $selected{$nr - 1} = !$selected{$nr - 1};
1850 } elsif ($sel eq "*" || $sel eq '^') {
1851 my $toggle = 0;
1852 $toggle = 1 if ($sel eq '*');
1853 for (my $i = 0; $i < $count; $i++) {
1854 $selected{$i} = $toggle;
1856 } elsif ($sel eq "0") {
1857 for (my $i = 0; $i < $count; $i++) {
1858 $selected{$i} = !$selected{$i};
# "t" plus a letter flips the selection of every entry whose role starts
# with the matching word(s): m, g, l or s.
1860 } elsif ($sel eq "t") {
1861 if (lc($str) eq "m") {
1862 for (my $i = 0; $i < $count; $i++) {
1863 $selected{$i} = !$selected{$i}
1864 if ($list[$i]->[1] =~ /^(maintainer|supporter)/i);
1866 } elsif (lc($str) eq "g") {
1867 for (my $i = 0; $i < $count; $i++) {
1868 $selected{$i} = !$selected{$i}
1869 if ($list[$i]->[1] =~ /^(author|commit|signer)/i);
1871 } elsif (lc($str) eq "l") {
1872 for (my $i = 0; $i < $count; $i++) {
1873 $selected{$i} = !$selected{$i}
1874 if ($list[$i]->[1] =~ /^(open list)/i);
1876 } elsif (lc($str) eq "s") {
1877 for (my $i = 0; $i < $count; $i++) {
1878 $selected{$i} = !$selected{$i}
1879 if ($list[$i]->[1] =~ /^(subscriber list)/i);
# "a#" / "s#" show or hide the authored / signed commit details of one
# entry; "a*" / "s*" show them for all entries and "a^" / "s^" hide them.
1882 } elsif ($sel eq "a") {
1883 if ($val > 0 && $val <= $count) {
1884 $authored{$val - 1} = !$authored{$val - 1};
1885 } elsif ($str eq '*' || $str eq '^') {
1886 my $toggle = 0;
1887 $toggle = 1 if ($str eq '*');
1888 for (my $i = 0; $i < $count; $i++) {
1889 $authored{$i} = $toggle;
1892 } elsif ($sel eq "s") {
1893 if ($val > 0 && $val <= $count) {
1894 $signed{$val - 1} = !$signed{$val - 1};
1895 } elsif ($str eq '*' || $str eq '^') {
1896 my $toggle = 0;
1897 $toggle = 1 if ($str eq '*');
1898 for (my $i = 0; $i < $count; $i++) {
1899 $signed{$i} = $toggle;
1902 } elsif ($sel eq "o") {
1903 $print_options = 1;
1904 $redraw = 1;
# The commands below change lookup settings; those that set $rerun cause
# the list to be recomputed after this command line has been processed.
1905 } elsif ($sel eq "g") {
1906 if ($str eq "f") {
1907 bool_invert(\$email_git_fallback);
1908 } else {
1909 bool_invert(\$email_git);
1911 $rerun = 1;
1912 } elsif ($sel eq "b") {
1913 if ($str eq "s") {
1914 bool_invert(\$email_git_blame_signatures);
1915 } else {
1916 bool_invert(\$email_git_blame);
1918 $rerun = 1;
1919 } elsif ($sel eq "c") {
1920 if ($val > 0) {
1921 $email_git_min_signatures = $val;
1922 $rerun = 1;
1924 } elsif ($sel eq "x") {
1925 if ($val > 0) {
1926 $email_git_max_maintainers = $val;
1927 $rerun = 1;
1929 } elsif ($sel eq "%") {
1930 if ($str ne "" && $val >= 0) {
1931 $email_git_min_percent = $val;
1932 $rerun = 1;
1934 } elsif ($sel eq "d") {
1935 if (vcs_is_git()) {
1936 $email_git_since = $str;
1937 } elsif (vcs_is_hg()) {
1938 $email_hg_since = $str;
1940 $rerun = 1;
# NOTE(review): this second test for "t" cannot be reached - the earlier
# ($sel eq "t") branch of this chain already handles every command starting
# with "t", so the signature-types toggle never runs.
1941 } elsif ($sel eq "t") {
1942 bool_invert(\$email_git_all_signature_types);
1943 $rerun = 1;
1944 } elsif ($sel eq "f") {
1945 bool_invert(\$file_emails);
1946 $rerun = 1;
1947 } elsif ($sel eq "r") {
1948 bool_invert(\$email_remove_duplicates);
1949 $rerun = 1;
1950 } elsif ($sel eq "m") {
1951 bool_invert(\$email_use_mailmap);
1952 read_mailmap();
1953 $rerun = 1;
1954 } elsif ($sel eq "k") {
1955 bool_invert(\$keywords);
1956 $rerun = 1;
1957 } elsif ($sel eq "p") {
1958 if ($str ne "" && $val >= 0) {
1959 $pattern_depth = $val;
1960 $rerun = 1;
1962 } elsif ($sel eq "h" || $sel eq "?") {
1963 print STDERR <<EOT
1965 Interactive mode allows you to select the various maintainers, submitters,
1966 commit signers and mailing lists that could be CC'd on a patch.
1968 Any *'d entry is selected.
1970 If you have git or hg installed, you can choose to summarize the commit
1971 history of files in the patch. Also, each line of the current file can
1972 be matched to its commit author and that commits signers with blame.
1974 Various knobs exist to control the length of time for active commit
1975 tracking, the maximum number of commit authors and signers to add,
1976 and such.
1978 Enter selections at the prompt until you are satisfied that the selected
1979 maintainers are appropriate. You may enter multiple selections separated
1980 by either commas or spaces.
1983 } else {
1984 print STDERR "invalid option: '$nr'\n";
1985 $redraw = 0;
# A setting changed: hand control to get_maintainers.  "goto &sub" replaces
# this call and passes the current @_ along.
1988 if ($rerun) {
1989 print STDERR "git-blame can be very slow, please have patience..."
1990 if ($email_git_blame);
1991 goto &get_maintainers;
1995 #drop not selected entries
1996 $count = 0;
1997 my @new_emailto = ();
1998 foreach my $entry (@list) {
1999 if ($selected{$count}) {
2000 push(@new_emailto, $list[$count]);
2002 $count++;
2004 return @new_emailto;
# Flip the flag behind a scalar reference: any true value becomes 0, any
# false value becomes 1.
sub bool_invert {
    my ($bool_ref) = @_;

    $$bool_ref = $$bool_ref ? 0 : 1;
}
# Normalise an email line and fold duplicates onto the first variant seen.
#
# The line is reformatted and passed through the mailmap.  When
# $email_remove_duplicates is set, it is then looked up, first by
# lower-cased name and then by lower-cased address, in
# %deduplicate_name_hash / %deduplicate_address_hash; a hit replaces both
# name and address with the remembered pair, a miss records the pair under
# both keys.
# Returns the resulting "name <address>" string.
sub deduplicate_email {
    my ($email) = @_;

    my ($name, $address) = parse_email($email);
    $email = mailmap_email(format_email($name, $address, 1));

    return $email if (!$email_remove_duplicates);

    ($name, $address) = parse_email($email);

    my $remembered;
    if ($name ne "" && $deduplicate_name_hash{lc($name)}) {
        $remembered = $deduplicate_name_hash{lc($name)};
    } elsif ($deduplicate_address_hash{lc($address)}) {
        $remembered = $deduplicate_address_hash{lc($address)};
    }

    if ($remembered) {
        ($name, $address) = ($remembered->[0], $remembered->[1]);
    } else {
        $deduplicate_name_hash{lc($name)} = [ $name, $address ];
        $deduplicate_address_hash{lc($address)} = [ $name, $address ];
    }

    return mailmap_email(format_email($name, $address, 1));
}
# Record, per author, the [commit, subject] pairs found in VCS log output.
#
# Authors, commits and subjects are collected from @lines into three
# parallel lists using the active VCS patterns; entry N of each list is
# taken to belong together.  Each pair is appended to
# @{$commit_author_hash{<author>}} unless an identical pair is already
# there.
sub save_commits_by_author {
    my (@lines) = @_;

    my @authors = ();
    my @commits = ();
    my @subjects = ();

    foreach my $line (@lines) {
        if ($line =~ m/$VCS_cmds{"author_pattern"}/) {
            my $author = $1;
            push(@authors, deduplicate_email($author));
        }
        push(@commits, $1) if ($line =~ m/$VCS_cmds{"commit_pattern"}/);
        push(@subjects, $1) if ($line =~ m/$VCS_cmds{"subject_pattern"}/);
    }

  AUTHOR:
    foreach my $i (0 .. $#authors) {
        my $recorded = $commit_author_hash{$authors[$i]} ||= [];

        foreach my $ref (@{$recorded}) {
            next AUTHOR
                if ($ref->[0] eq $commits[$i] &&
                    $ref->[1] eq $subjects[$i]);
        }

        push(@{$recorded}, [ ($commits[$i], $subjects[$i]) ]);
    }
}
# Record, per signer, the [commit, subject, type] triples found in VCS log
# output.
#
# The most recent commit id and subject seen while scanning @lines are
# attached to every following signature line.  Each triple is appended to
# @{$commit_signer_hash{<signer>}} unless an identical one is already
# there.
sub save_commits_by_signer {
    my (@lines) = @_;

    my $commit = "";
    my $subject = "";

  LINE:
    foreach my $line (@lines) {
        $commit = $1 if ($line =~ m/$VCS_cmds{"commit_pattern"}/);
        $subject = $1 if ($line =~ m/$VCS_cmds{"subject_pattern"}/);

        next LINE unless ($line =~ /^[ \t]*${signature_pattern}.*\@.*$/);

        my ($types_ref, $signers_ref) = extract_formatted_signatures($line);
        my $type = $types_ref->[0];
        my $signer = deduplicate_email($signers_ref->[0]);

        my $recorded = $commit_signer_hash{$signer} ||= [];

        foreach my $ref (@{$recorded}) {
            next LINE
                if ($ref->[0] eq $commit &&
                    $ref->[1] eq $subject &&
                    $ref->[2] eq $type);
        }

        push(@{$recorded}, [ ($commit, $subject, $type) ]);
    }
}
# Turn a list of people (one entry per occurrence) into ranked recipients.
#
# $role:    role label for the people added
# $divisor: total used for the percentage; a value <= 0 is reported and
#           replaced by 1
# @lines:   email lines, repeated once per contribution
#
# The lines are mailmapped and counted, then visited from most to least
# frequent.  Ignored addresses are skipped.  The walk stops at the first
# person below $email_git_min_signatures or $email_git_min_percent, or once
# more than $email_git_max_maintainers people have been considered.  With
# $output_rolestats set the role carries "count/divisor=percent%".
sub vcs_assign {
    my ($role, $divisor, @lines) = @_;

    return if (@lines <= 0);

    if ($divisor <= 0) {
        warn("Bad divisor in " . (caller(0))[3] . ": $divisor\n");
        $divisor = 1;
    }

    @lines = mailmap(@lines);

    return if (@lines <= 0);

    @lines = sort(@lines);

    # uniq -c
    my %tally;
    $tally{$_}++ for @lines;

    # sort -rn
    my $count = 0;
    foreach my $line (sort {$tally{$b} <=> $tally{$a}} keys %tally) {
        my $sign_offs = $tally{$line};
        my $percent = $sign_offs * 100 / $divisor;
        $percent = 100 if ($percent > 100);

        next if (ignore_email_address($line));

        $count++;
        last if ($sign_offs < $email_git_min_signatures);
        last if ($count > $email_git_max_maintainers);
        last if ($percent < $email_git_min_percent);

        push_email_address($line, '');

        my $label = $role;
        if ($output_rolestats) {
            my $fmt_percent = sprintf("%.0f", $percent);
            $label = "$role:$sign_offs/$divisor=$fmt_percent%";
        }
        add_role($line, $label);
    }
}
# Add the people who signed or authored commits touching $file.
#
# Runs the VCS "find_signers_cmd" and assigns the roles "commit_signer" and
# "authored".  When there is exactly one stat line per author line, the two
# numbers captured from each stat line are additionally summed per author
# and assigned as "added_lines" / "removed_lines".
# Does nothing when no VCS is available.
#
# $file (and the other scalars declared before the substitutions) must keep
# their names: the command and stat templates are expanded with a string
# eval that resolves "$name" references against the variables in scope.
sub vcs_file_signoffs {
    my ($file) = @_;

    my $authors_ref;
    my $signers_ref;
    my $stats_ref;
    my $commits;

    $vcs_used = vcs_exists();
    return if (!$vcs_used);

    my $cmd = $VCS_cmds{"find_signers_cmd"};
    $cmd =~ s/(\$\w+)/$1/eeg;    # interpolate $cmd

    ($commits, $signers_ref, $authors_ref, $stats_ref) =
        vcs_find_signers($cmd, $file);

    my @signers = defined($signers_ref) ? @{$signers_ref} : ();
    my @authors = defined($authors_ref) ? @{$authors_ref} : ();
    my @stats = defined($stats_ref) ? @{$stats_ref} : ();

    # print("commits: <$commits>\nsigners:<@signers>\nauthors: <@authors>\nstats: <@stats>\n");

    @signers = map { deduplicate_email($_) } @signers;

    vcs_assign("commit_signer", $commits, @signers);
    vcs_assign("authored", $commits, @authors);

    # Line statistics are only attributable when each author line has its
    # own stat line.
    return if ($#authors != $#stats);

    my $stat_pattern = $VCS_cmds{"stat_pattern"};
    $stat_pattern =~ s/(\$\w+)/$1/eeg;    #interpolate $stat_pattern

    my $added = 0;
    my $deleted = 0;
    foreach my $stat (@stats) {
        next unless ($stat =~ /$stat_pattern/);
        $added += $1;
        $deleted += $2;
    }

    my @tmp_authors = uniq(map { deduplicate_email($_) } uniq(@authors));

    my @list_added = ();
    my @list_deleted = ();
    foreach my $author (@tmp_authors) {
        my $auth_added = 0;
        my $auth_deleted = 0;
        foreach my $i (0 .. $#stats) {
            if ($author eq deduplicate_email($authors[$i]) &&
                $stats[$i] =~ /$stat_pattern/) {
                $auth_added += $1;
                $auth_deleted += $2;
            }
        }
        # One list entry per line, so vcs_assign() can count them.
        push(@list_added, ($author) x $auth_added);
        push(@list_deleted, ($author) x $auth_deleted);
    }

    vcs_assign("added_lines", $added, @list_added);
    vcs_assign("removed_lines", $deleted, @list_deleted);
}
# Add the people responsible for the current lines of $file, using blame.
#
# Steps:
#   1. Blame the file; count the distinct commits and the blamed lines.
#   2. With $email_git_blame_signatures, collect the signers of those
#      commits: one query per commit, or for hg a single query covering all
#      commits joined with " -r ".
#   3. With $from_filename and $output_rolestats, look up commit authors.
#      For hg they are appended to the signer list; otherwise each author
#      is counted once per blamed line matching the commit and assigned as
#      "authored lines".
#   4. Deduplicate the signers and assign them as "commits" (with
#      $from_filename) or "modified commits".
# Does nothing when no VCS is available.
#
# $file and $commit must keep their names: the command templates are
# expanded with a string eval that resolves "$name" references against the
# variables in scope.
sub vcs_file_blame {
    my ($file) = @_;

    my @signers = ();

    $vcs_used = vcs_exists();
    return if (!$vcs_used);

    my @all_commits = vcs_blame($file);
    my @commits = uniq(@all_commits);
    my $total_commits = @commits;
    my $total_lines = @all_commits;

    if ($email_git_blame_signatures) {
        # hg takes all revisions in one command; other VCSs one at a time.
        my @targets = vcs_is_hg() ? (join(" -r ", @commits)) : @commits;

        foreach my $commit (@targets) {
            my $cmd = $VCS_cmds{"find_commit_signers_cmd"};
            $cmd =~ s/(\$\w+)/$1/eeg;    #substitute variables in $cmd

            my (undef, $commit_signers_ref) = vcs_find_signers($cmd, $file);
            push(@signers, @{$commit_signers_ref})
                if defined $commit_signers_ref;
        }
    }

    if ($from_filename && $output_rolestats) {
        my @blame_signers;

        if (vcs_is_hg()) {
            @commits = uniq(@commits);
            @commits = sort(@commits);
            my $commit = join(" -r ", @commits);

            my $cmd = $VCS_cmds{"find_commit_author_cmd"};
            $cmd =~ s/(\$\w+)/$1/eeg;    #substitute variables in $cmd

            my @lines = $VCS_cmds{"execute_cmd"}->($cmd);

            @lines = grep(!/${penguin_chiefs}/i, @lines)
                if (!$email_git_penguin_chiefs);

            if (@lines) {
                my @authors = ();
                foreach my $line (@lines) {
                    next unless ($line =~ m/$VCS_cmds{"author_pattern"}/);
                    my $author = $1;
                    push(@authors, deduplicate_email($author));
                }

                save_commits_by_author(@lines) if ($interactive);
                save_commits_by_signer(@lines) if ($interactive);

                push(@signers, @authors);
            }
        } else {
            foreach my $commit (@commits) {
                my $cmd = $VCS_cmds{"find_commit_author_cmd"};
                $cmd =~ s/(\$\w+)/$1/eeg;    #interpolate $cmd
                my @author = vcs_find_author($cmd);
                next if !@author;

                my $formatted_author = deduplicate_email($author[0]);

                # One entry per blamed line that matches this commit.
                my $count = grep(/$commit/, @all_commits);
                push(@blame_signers, ($formatted_author) x $count);
            }
        }

        vcs_assign("authored lines", $total_lines, @blame_signers)
            if (@blame_signers);
    }

    foreach my $signer (@signers) {
        $signer = deduplicate_email($signer);
    }
    vcs_assign($from_filename ? "commits" : "modified commits",
               $total_commits, @signers);
}
# Ask the VCS whether it knows $file.
#
# Runs the "file_exists_cmd" template with stderr folded into stdout.
# Returns 0 when no VCS is available or the command exits non-zero;
# otherwise the number of output lines (the handler is called in scalar
# context).
#
# $file must keep its name: the command template is expanded with a string
# eval that resolves "$name" references against the variables in scope.
sub vcs_file_exists {
    my ($file) = @_;

    my $vcs_used = vcs_exists();
    return 0 if (!$vcs_used);

    my $cmd = $VCS_cmds{"file_exists_cmd"};
    $cmd =~ s/(\$\w+)/$1/eeg;    # interpolate $cmd
    $cmd .= " 2>&1";

    my $exists = $VCS_cmds{"execute_cmd"}->($cmd);

    return ($? != 0) ? 0 : $exists;
}
# List the files the VCS tracks for $file.
#
# Runs the "list_files_cmd" template and returns its output lines.
# Returns an empty list when no VCS is available or the command exits
# non-zero.  Both failure cases give the same result: returning 0 for a
# missing VCS would hand list-context callers the one-element list (0),
# which reads as a file named "0".
#
# $file must keep its name: the command template is expanded with a string
# eval that resolves "$name" references against the variables in scope.
sub vcs_list_files {
    my ($file) = @_;

    my @lsfiles = ();

    my $vcs_used = vcs_exists();
    return () if (!$vcs_used);

    my $cmd = $VCS_cmds{"list_files_cmd"};
    $cmd =~ s/(\$\w+)/$1/eeg;    # interpolate $cmd
    @lsfiles = &{$VCS_cmds{"execute_cmd"}}($cmd);

    return () if ($? != 0);

    return @lsfiles;
}
# Return the arguments with repeated values removed, keeping the first
# occurrence of each and the original order.
sub uniq {
    my (@parms) = @_;

    my %seen;
    my @kept = ();
    foreach my $item (@parms) {
        next if ($seen{$item}++);
        push(@kept, $item);
    }

    return @kept;
}
# Return the arguments sorted as strings, with repeated values removed.
sub sort_and_uniq {
    my (@parms) = @_;

    my %seen;
    my @kept = ();
    foreach my $item (sort @parms) {
        next if ($seen{$item}++);
        push(@kept, $item);
    }

    return @kept;
}
# Tidy email mentions harvested from file contents.
#
# For each entry: addresses wrapped in (), <> or {} (or not wrapped at all)
# are normalised to <address>; a name consisting of a single quoted comma
# or period is dropped; a name of more than two words is cut down to its
# last two words, or its last three when the first or middle of those looks
# like an initial; one leading and one trailing comma/period is stripped
# from the name, also just inside surrounding double quotes.
# Returns the list of formatted emails.
sub clean_file_emails {
    my (@file_emails) = @_;
    my @fmt_emails = ();

    foreach my $email (@file_emails) {
        $email =~ s/[\(\<\{]{0,1}([A-Za-z0-9_\.\+-]+\@[A-Za-z0-9\.-]+)[\)\>\}]{0,1}/\<$1\>/g;
        my ($name, $address) = parse_email($email);
        $name = "" if ($name eq '"[,\.]"');

        my @nw = split(/[^A-Za-zÀ-ÿ\'\,\.\+-]/, $name);
        if (@nw > 2) {
            my ($first, $middle, $last) = @nw[-3 .. -1];

            my $first_is_initial =
                (length($first) == 1 && $first =~ m/[A-Za-z]/) ||
                (length($first) == 2 && substr($first, -1) eq ".");
            my $middle_is_initial =
                length($middle) == 1 ||
                (length($middle) == 2 && substr($middle, -1) eq ".");

            $name = ($first_is_initial || $middle_is_initial)
                ? "$first $middle $last"
                : "$middle $last";
        }

        # Trailing punctuation, bare or just before a closing quote.
        if (substr($name, -1) =~ /[,\.]/) {
            $name = substr($name, 0, length($name) - 1);
        } elsif (substr($name, -2) =~ /[,\.]"/) {
            $name = substr($name, 0, length($name) - 2) . '"';
        }

        # Leading punctuation, bare or just after an opening quote.
        if (substr($name, 0, 1) =~ /[,\.]/) {
            $name = substr($name, 1, length($name) - 1);
        } elsif (substr($name, 0, 2) =~ /"[,\.]/) {
            $name = '"' . substr($name, 2, length($name) - 2);
        }

        push(@fmt_emails, format_email($name, $address, $email_usename));
    }

    return @fmt_emails;
}
# Collapse a list of [address, role] pairs into output lines.
#
# Only the first pair seen for a given address is kept.  When $output_roles
# is set each line is "address (role)"; otherwise it is the bare address.
sub merge_email {
    my %seen;
    my @lines;

    foreach my $entry (@_) {
        my ($address, $role) = @$entry;

        next if $seen{$address};
        $seen{$address} = 1;

        push(@lines, $output_roles ? "$address ($role)" : $address);
    }

    return @lines;
}
# Print the given items to standard output: one per line when
# $output_multiline is set, otherwise joined with $output_separator on a
# single newline-terminated line.
sub output {
    my (@parms) = @_;

    if (!$output_multiline) {
        print(join($output_separator, @parms) . "\n");
    } else {
        print("$_\n") foreach (@parms);
    }
}
# Address regexp, built on first use by the rfc822_* validators below.
my $rfc822re;

# Build and return (as a string) a regexp that matches one RFC 822 address.
sub make_rfc822re {
    # The basic lexical tokens are specials, domain_literal, quoted_string,
    # atom and comment; each may be followed by linear white space (or by
    # comments).  This regexp only works on input whose comments have
    # already been stripped and replaced with linear white space.
    my $lwsp = $rfc822_lwsp;

    my $specials = '()<>@,;:\\\\".\\[\\]';
    my $controls = '\\000-\\037\\177';

    my $dtext          = "[^\\[\\]\\r\\\\]";
    my $domain_literal = "\\[(?:${dtext}|\\\\.)*\\]${lwsp}*";

    my $quoted_string = "\"(?:[^\\\"\\r\\\\]|\\\\.|${lwsp})*\"${lwsp}*";

    # A zero-width assertion marks the end of an atom; a plain trailing
    # "lwsp*" makes the regexp engine hang occasionally.
    my $atom      = "[^${specials} ${controls}]+(?:${lwsp}+|\\Z|(?=[\\[\"${specials}]))";
    my $word      = "(?:${atom}|${quoted_string})";
    my $localpart = "${word}(?:\\.${lwsp}*${word})*";

    my $sub_domain = "(?:${atom}|${domain_literal})";
    my $domain     = "${sub_domain}(?:\\.${lwsp}*${sub_domain})*";

    my $addr_spec = "${localpart}\@${lwsp}*${domain}";

    my $phrase     = "${word}*";
    my $route      = "(?:\@${domain}(?:,\@${lwsp}*${domain})*:${lwsp}*)";
    my $route_addr = "\\<${lwsp}*${route}?${addr_spec}\\>${lwsp}*";
    my $mailbox    = "(?:${addr_spec}|${phrase}${route_addr})";

    my $group = "${phrase}:${lwsp}*(?:${mailbox}(?:,\\s*${mailbox})*)?;\\s*";

    # An address is either a single mailbox or a group of mailboxes.
    return "${lwsp}*(?:${mailbox}|${group})";
}
# Return a copy of the argument with every parenthesised comment that lies
# outside a quoted string replaced by a single space.
sub rfc822_strip_comments {
    my ($text) = @_;

    # Each pass removes one comment that contains no nested parentheses, so
    # repeating until nothing matches unwinds nested comments from the inside
    # out.  The simpler regexps in the Email Addressing FAQ are imperfect --
    # they miss escaped chars in atoms, for example.
    1 while ($text =~ s/^((?:[^"\\]|\\.)*
                    (?:"(?:[^"\\]|\\.)*"(?:[^"\\]|\\.)*)*)
                    \((?:[^()\\]|\\.)*\)/$1 /osx);

    return $text;
}
# valid: returns true if the parameter is an RFC822 valid address
#
# Comments are stripped first; the remainder must match the address regexp
# in full and consist only of characters allowed by $rfc822_char.
sub rfc822_valid {
    my $addr = rfc822_strip_comments(shift);

    # Build the address regexp on first use.
    $rfc822re ||= make_rfc822re();

    return $addr =~ m/^$rfc822re$/so && $addr =~ m/^$rfc822_char*$/;
}
# validlist: In scalar context, returns true if the parameter is an RFC822
#            valid list of addresses.
#
#            In list context, returns an empty list on failure (an invalid
#            address was found); otherwise a list whose first element is the
#            number of addresses found and whose remaining elements are the
#            addresses.  The leading count is what lets a caller tell failure
#            (invalid) apart from success with no addresses found, because an
#            empty string is a valid list.
sub rfc822_validlist {
    my $list = rfc822_strip_comments(shift);

    # Build the address regexp on first use.
    $rfc822re ||= make_rfc822re();

    # Null list items are valid according to the RFC, hence the optional
    # address on either side of each comma.
    if (!($list =~ m/^(?:$rfc822re)?(?:,(?:$rfc822re)?)*$/so &&
          $list =~ m/^$rfc822_char*$/)) {
        return wantarray ? () : 0;
    }

    my @found;
    while ($list =~ m/(?:^|,$rfc822_lwsp*)($rfc822re)/gos) {
        push(@found, $1);
    }

    return wantarray ? (scalar(@found), @found) : 1;
}