checkAUTHORS.pl again
[p5sagit/p5-mst-13.2.git] / Porting / checkAUTHORS.pl
CommitLineData
5649b9c9 1#!/usr/bin/perl -w
2use strict;
3use Text::Wrap;
4$Text::Wrap::columns = 80;
5my ($committer, $patch, $log);
6use Getopt::Long;
7
2b0ba25f 8my ($rank, $percentage, $cumulative, $reverse, $ta, @authors, %authors,
9 %untraced, %patchers, %committers);
ff4d71b5 10my $result = GetOptions ("rank" => \$rank, # rank authors
11 "thanks-applied" => \$ta, # ranks committers
15b8f96d 12 "acknowledged=s" => \@authors , # authors files
13 "percentage" => \$percentage, # show as %age
2b0ba25f 14 "cumulative" => \$cumulative,
15 "reverse" => \$reverse,
15b8f96d 16 );
5649b9c9 17
ff4d71b5 18if (!$result or (($rank||0) + ($ta||0) + (@authors ? 1 : 0) != 1) or !@ARGV) {
5649b9c9 19 die <<"EOS";
20$0 --rank Changelogs # rank authors by patches
21$0 --acknowledged <authors file> Changelogs # Display unacknowledged authors
ff4d71b5 22$0 --thanks-applied Changelogs # ranks committers
15b8f96d 23$0 --percentage ... # show rankings as percentages
2b0ba25f 24$0 --cumulative ... # show rankings cumulatively
25$0 --reverse ... # show rankings in reverse
5649b9c9 26Specify stdin as - if needs be. Remember that option names can be abbreviated.
27EOS
28}
29
30my %map = reverse (
31 # "Correct" => "Alias"
32 adi => "enache\100rdslink.ro",
33 alanbur => "alan.burlison\100sun.com",
34 ams => "ams\100wiw.org",
35 chip => "chip\100pobox.com",
36 davem => "davem\100fdgroup.com",
37 doughera => " doughera\100lafayette.edu",
38 gbarr => "gbarr\100pobox.com",
39 gsar => "gsar\100activestate.com",
40 hv => "hv\100crypt.compulink.co.uk",
41 jhi => "jhi\100iki.fi",
3bd76f0a 42 merijn => "h.m.brand\100xs4all.nl",
5649b9c9 43 mhx => "mhx-perl\100gmx.net",
44 nicholas => "nick\100unfortu.net",
45 nick => "nick\100ing-simmons.net",
46 pudge => "pudge\100pobox.com",
47 rgs => "rgarciasuarez\100free.fr",
48 sky => "sky\100nanisky.com",
5e266217 49 steveh => "steve.hay\100uk.radan.com",
50 stevep => "steve\100fisharerojo.org",
a7ad7795 51 gisle => "gisle\100activestate.com",
5649b9c9 52 "abigail\100abigail.nl"=> "abigail\100foad.org",
53 "chromatic\100wgz.org" => "chromatic\100rmci.net",
54 "slaven\100rezic.de" => "slaven.rezic\100berlin.de",
55 "mjtg\100cam.ac.uk" => "mjtg\100cus.cam.ac.uk",
56 "robin.barker\100npl.co.uk" => "rmb1\100cise.npl.co.uk",
57 "paul.marquess\100btinternet.com"
58 => "paul_marquess\100yahoo.co.uk",
59 "wolfgang.laun\100chello.at" =>
60 "wolfgang.laun\100alcatel.at",
61 "t.jenness\100jach.hawaii.edu" => "timj\100jach.hawaii.edu",
62 "abe\100ztreet.demon.nl" => "abeltje\100cpan.org",
a7ad7795 63 "nospam-abuse\100bloodgate.com" => "tels\100bloodgate.com",
5649b9c9 64 "jfriedl\100yahoo.com" => "jfriedl\100yahoo-inc.com",
65 "japhy\100pobox.com" => "japhy\100pobox.org",
66 "gellyfish\100gellyfish.com" => "jns\100gellyfish.com",
a7ad7795 67 "jcromie\100divsol.com" => "jcromie\100cpan.org",
68 "demerphq\100gmail.com" => "demerphq\100hotmail.com",
69 "rick\100consumercontact.com" => "rick\100bort.ca",
70 "vkonovalov\100spb.lucent.com"
71 => "vkonovalov\100peterstar.ru",
72 "rjk\100linguist.dartmouth.edu"
73 => "rjk\100linguist.thayer.dartmouth.edu",
74 "domo\100computer.org" => "shouldbedomo\100mac.com",
75 "kane\100dwim.org" => "kane\100xs4all.net",
76 "allens\100cpan.org" => "easmith\100beatrice.rutgers.edu",
77 "spoon\100cpan.org" => "spoon\100dellah.org",
657b1971 78 "ben_tilly\100operamail.com" => "btilly\100gmail.com",
79 "mbarbon\100dsi.unive.it" => "mattia.barbon\100libero.it",
80 "tassilo.parseval\100post.rwth-aachen.de" =>
81 "tassilo.von.parseval\100rwth-aachen.de",
82 "dcd\100tc.fluke.com" => "david.dyck\100fluke.com",
83 "kroepke\100dolphin-services.de"
84 => "kay\100dolphin-services.de",
85 "sebastien\100aperghis.net" => "maddingue\100free.fr",
86 "radu\100netsoft.ro" => "rgreab\100fx.ro",
87 "rick\100consumercontact.com"
88 => "rick.delaney\100rogers.com",
89 "p5-authors\100crystalflame.net"
90 => "perl\100crystalflame.net",
91 "stef\100mongueurs.net" => "stef\100payrard.net",
18f651c1 92 "kstar\100wolfetech.com" => "kstar\100cpan.org",
93 "7k8lrvf02\100sneakemail.com" =>
94 "kjx9zthh3001\100sneakemail.com",
95 "mgjv\100comdyn.com.au" => "mgjv\100tradingpost.com.au",
96 "thomas.dorner\100start.de" => "tdorner\100amadeus.net",
97 "ajohnson\100nvidia.com" => "ajohnson\100wischip.com",
5f9c001d 98 "phil\100perkpartners.com" => "phil\100finchcomputer.com",
39243be7 99 "tom.horsley\100mail.ccur.com" => "tom.horsley\100ccur.com",
100 "rootbeer\100teleport.com" => "rootbeer\100redcat.com",
101 "cp\100onsitetech.com" => "publiustemp-p5p\100yahoo.com",
102 "epeschko\100den-mdev1" => "esp5\100pge.com",
103 "pimlott\100idiomtech.com" => "andrew\100pimlott.net",
104 "fugazi\100zyx.net" => "larrysh\100cpan.org",
105 "merijnb\100iloquent.nl" => "merijnb\100iloquent.com",
106 "whatever\100davidnicol.com" => "davidnicol\100gmail.com",
107 "rmgiroux\100acm.org" => "rmgiroux\100hotmail.com",
108 "smcc\100mit.edu" => "smcc\100ocf.berkeley.edu",
0ad39044 109 "schubiger\100cpan.org" => "steven\100accognoscere.org",
2b90724c 110 "richard.foley\100ubsw.com"
111 => "richard.foley\100t-online.de",
112 "damian\100cs.monash.edu.au" => "damian\100conway.org",
113 "gp\100familiehaase.de" => "gerrit\100familiehaase.de",
114 "juerd\100cpan.org" => "juerd\100convolution.nl",
115 "paul.green\100stratus.com"
116 => "paul_greenvos\100vos.stratus.com",
117 "alian\100cpan.org" => "alian\100alianwebserver.com",
bf607fdc 118 "david.dyck\100fluke.com" => "dcd\100tc.fluke.com",
5e71429c 119 "jdhedden\100" . "1979.usna.com" => "jdhedden\100cpan.org",
a7ad7795 120 # Maybe we should special case this to get real names out?
121 "perlbug\100perl.org" => "perlbug-followup\100perl.org",
5649b9c9 122 );
123
124# Make sure these are all lower case.
125
5649b9c9 126$map{"autrijus\100egb.elixus.org"} = $map{"autrijus\100geb.elixus.org"}
2b90724c 127 = $map{"autrijus\100gmail.com"} = $map{"autrijus\100ossf.iis.sinica.edu.tw"}
4d8e9145 128 = $map{"autrijus\100autrijus.org"} = "cpan\100audreyt.org";
5649b9c9 129$map{"ilya\100math.ohio-state.edu"} = $map{"ilya\100math.berkeley.edu"}
130 = $map{"ilya\100math.berkeley.edu"} = "nospam-abuse\100ilyaz.org";
5649b9c9 131$map{"philip.newton\100gmx.net"} = $map{"philip.newton\100datenrevision.de"}
a7ad7795 132 = $map{"pnewton\100gmx.de"} = "pne\100cpan.org",
5649b9c9 133$map{"simon\100pembro4.pmb.ox.ac.uk"} = $map{"simon\100brecon.co.uk"}
134 = $map{"simon\100othersideofthe.earth.li"} = $map{"simon\100cozens.net"}
135 = $map{"simon\100netthink.co.uk"} = "simon\100simon-cozens.org";
136$map{"spider\100web.zk3.dec.com"} = $map{"spider\100leggy.zk3.dec.com"}
137 = $map{"spider-perl\100orb.nashua.nh.us"}
138 = $map{"spider\100peano.zk3.dec.com"}
139 = "spider\100orb.nashua.nh.us";
2b90724c 140$map{"andreas.koenig.gmwojprw\100franz.ak.mind.de"}
141 = $map{"a.koenig\100mind.de"} = "andreas.koenig\100anima.de";
5649b9c9 142$map{"japhy\100perlmonk.org"} = $map{"japhy\100cpan.org"}
143 = "japhy\100pobox.com";
144$map{"rmbarker\100cpan.org"} = "robin.barker\100npl.co.uk";
a7ad7795 145$map{"yves.orton\100de.mci.com"} = $map{"yves.orton\100mciworldcom.de"}
657b1971 146 = "demerphq\100gmail.com";
a7ad7795 147$map{"jim.cromie\100gmail.com"} = "jcromie\100divsol.com";
148$map{"perl_dummy\100bloodgate.com"} = "nospam-abuse\100bloodgate.com";
149$map{"paul.marquess\100ntlworld.com"} = "paul.marquess\100btinternet.com";
657b1971 150$map{"konovalo\100mail.wplus.net"} = $map{"vadim\100vkonovalov.ru"}
151 = "vkonovalov\100spb.lucent.com";
152$map{"kane\100cpan.org"} = "kane\100dwim.org";
153$map{"rs\100crystalflame.net"} = "p5-authors\100crystalflame.net";
18f651c1 154$map{"(srezic\100iconmobile.com)"} = "slaven\100rezic.de";
155$map{"perl\100dellah.anu.edu.au"} = "spoon\100cpan.org";
39243be7 156$map{"rjk-perl-p5p\100tamias.net"} = "rjk\100linguist.dartmouth.edu";
0ad39044 157$map{"sts\100accognoscere.org"} = "schubiger\100cpan.org";
6fbb3cd3 158$map{"s.payrard\100wanadoo.fr"} = "stef\100mongueurs.net";
2b90724c 159$map{"richard.foley\100ubs.com"} = "richard.foley\100ubsw.com";
c0707526 160$map{"jerry\100hedden.us"} = $map{"jdhedden\100" . "1979.usna.com"} =
161$map{"jdhedden\100gmail.com"} = $map{"jdhedden\100yahoo.com"}
162 = "jdhedden\100cpan.org";
2b90724c 163# I assume that Ton Hopsel's lack of e-mail address in AUTHORS is deliberate
164$map{"me-02\100ton.iguana.be"} = $map{"perl-5.8.0\100ton.iguana.be"}
165 = $map{"perl5-porters\100ton.iguana.be"} = "!";
166# No real name for these address
167$map{$_} = "?" foreach ("grommel\100sears.com", "pxm\100nubz.org",
5e71429c 168 "padre\100elte.hu",
2b90724c 169 "nothingmuch\100woobling.org", "bob\100starlabs.net",
170 "bbucklan\100jpl-devvax.jpl.nasa.gov",
171 "bilbo\100ua.fm", "mats\100sm5sxl.net",
172 "chris\100ex-parrot.com",
173 "kaminsky\100math.huji.ac.il",
174 "bonefish\100cs.tu-berlin.de",
175 "bstrand\100switchmanagement.com",
176 "glasser\100tang-eleven-seventy-nine.mit.edu",
177 "raf\100tradingpost.com.au", "erik\100cs.uni-jena.de",
178 "jms\100mathras.comcast.net", "kvr\100centrum.cz",
179 "perlbug\100veggiechinese.net",
180 "scott\100perlcode.org",
181 );
182# We don't have an e-mail address for Beau Cox
183$map{"beau\100beaucox.com"} = "?";
6fbb3cd3 184
185$map{"rgarciasuarez\100mandrakesoft.com"}
186 = $map{"rgarciasuarez\100mandriva.com"}
f5adfaf5 187 = $map{"rgarciasuarez\100gmail.com"}
6fbb3cd3 188 = $map{"raphel.garcia-suarez\100hexaflux.com"} = "rgs";
189$map{"jhietaniemi\100gmail.com"} = $map{"jhi\100kosh.hut.fi"}
2b90724c 190 = $map{"jhi\100cc.hut.fi"} = $map{"jarkko.hietaniemi\100nokia.com"} = "jhi";
6fbb3cd3 191$map{"nick\100ccl4.org"} = $map{"nick\100talking.bollo.cx"}
192 = $map{"nick\100plum.flirble.org"} = $map{"nick\100babyhippo.co.uk"}
193 = $map{"nick\100bagpuss.unfortu.net"} = "nicholas";
194$map{"craig.berry\100psinetcs.com"} = $map{"craig.berry\100metamorgs.com"}
195 = $map{"craig.berry\100signaltreesolutions.com"}
196 = $map{"craigberry\100mac.com"} = "craigb";
197$map{"davem\100iabyn.nospamdeletethisbit.com" }
2b90724c 198 = $map{"davem\100fdgroup.co.uk"} = $map{"davem\100fdisolutions.com"}
199 = "davem";
6fbb3cd3 200$map{"alan.burlison\100uk.sun.com"} = "alanbur";
201$map{"artur\100contiller.se"} = $map{"arthur\100contiller.se"} = "sky";
202$map{"h.m.brand\100hccnet.nl"} = $map{"merijn\100l1.procura.nl"} = "merijn";
2b90724c 203$map{"nik\100tiuk.ti.com"} = $map{"nick.ing-simmons\100elixent.com"} = "nick";
a7ad7795 204$map{"hv\100crypt.org"} = "hv";
205$map{"gisle\100aas.no"} = "gisle";
9d5e8f04 206$map{"gsar\100cpan.org"} = "gsar";
a7ad7795 207
5649b9c9 208if (@authors) {
209 my %raw;
210 foreach my $filename (@authors) {
211 open FH, "<$filename" or die "Can't open $filename: $!";
212 while (<FH>) {
213 next if /^\#/;
214 next if /^-- /;
215 if (/<([^>]+)>/) {
216 # Easy line.
217 $raw{$1}++;
218 } elsif (/^([-A-Za-z0-9 .\'À-ÖØöø-ÿ]+)[\t\n]/) {
219 # Name only
220 $untraced{$1}++;
221 } else {
222 chomp;
223 warn "Can't parse line '$_'";
224 }
225 }
226 }
227 foreach (keys %raw) {
228 print "E-mail $_ occurs $raw{$_} times\n" if $raw{$_} > 1;
229 $_ = lc $_;
230 $authors{$map{$_} || $_}++;
231 }
2b90724c 232 ++$authors{'!'};
233 ++$authors{'?'};
5649b9c9 234}
235
236while (<>) {
237 next if /^-+/;
238 if (m!^\[\s+(\d+)\]\s+By:\s+(\S+)\s+on!) {
239 # new patch
240 my @new = ($1, $2);
241 &process ($committer, $patch, $log);
242 ($patch, $committer) = @new;
243 undef $log;
244 } elsif (s/^(\s+Log: )//) {
245 die "Duplicate Log:" if $log;
246 $log = $_;
247 my $prefix = " " x length $1;
248 LOG: while (<>) {
84fd1186 249 next if /^$/;
bdb5e10e 250 s/^\t/ /;
5649b9c9 251 if (s/^$prefix//) {
252 $log .= $_;
253 } elsif (/^\s+Branch:/) {
254 last LOG;
255 } else {
84fd1186 256 chomp;
257 die "Malformed log end with '$_'";
5649b9c9 258 }
259 }
260 }
261}
262
263&process ($committer, $patch, $log);
264
265if ($rank) {
ff4d71b5 266 &display_ordered(\%patchers);
267} elsif ($ta) {
268 &display_ordered(\%committers);
5649b9c9 269} elsif (%authors) {
270 my %missing;
271 foreach (sort keys %patchers) {
272 next if $authors{$_};
273 # Sort by number of patches, then name.
274 $missing{$patchers{$_}}->{$_}++;
275 }
276 foreach my $patches (sort {$b <=> $a} keys %missing) {
277 print "$patches patch(es)\n";
278 foreach my $author (sort keys %{$missing{$patches}}) {
279 print " $author\n";
280 }
281 }
282}
283
284sub display_ordered {
ff4d71b5 285 my $what = shift;
5649b9c9 286 my @sorted;
15b8f96d 287 my $total;
ff4d71b5 288 while (my ($name, $count) = each %$what) {
5649b9c9 289 push @{$sorted[$count]}, $name;
15b8f96d 290 $total += $count;
5649b9c9 291 }
292
293 my $i = @sorted;
2b0ba25f 294 return unless @sorted;
295 my $sum = 0;
296 foreach my $i ($reverse ? 0 .. $#sorted : reverse 0 .. $#sorted) {
5649b9c9 297 next unless $sorted[$i];
15b8f96d 298 my $prefix;
2b0ba25f 299 $sum += $i * @{$sorted[$i]};
300 # Value to display is either this one, or the cumulative sum.
301 my $value = $cumulative ? $sum : $i;
15b8f96d 302 if ($percentage) {
2b0ba25f 303 $prefix = sprintf "%6.2f:\t", 100 * $value / $total;
15b8f96d 304 } else {
2b0ba25f 305 $prefix = "$value:\t";
15b8f96d 306 }
307 print wrap ($prefix, "\t", join (" ", sort @{$sorted[$i]}), "\n");
5649b9c9 308 }
309}
310
311sub process {
312 my ($committer, $patch, $log) = @_;
313 return unless $committer;
2b90724c 314 my @authors = $log =~ /From:\s+.*?([^"\@ \t\n<>]+\@[^"\@ \t\n<>]+)/gm;
5649b9c9 315
316 if (@authors) {
317 foreach (@authors) {
318 s/^<//;
319 s/>$//;
320 $_ = lc $_;
321 $patchers{$map{$_} || $_}++;
322 }
323 # print "$patch: @authors\n";
ff4d71b5 324 ++$committers{$committer};
5649b9c9 325 } else {
326 # print "$patch: $committer\n";
327 # Not entirely fair as this means that the maint pumpking scores for
328 # everything intergrated that wasn't a third party patch in blead
329 $patchers{$committer}++;
330 }
331}
332
333