Part one of y2038 changes for Schwern
[p5sagit/p5-mst-13.2.git] / Porting / checkAUTHORS.pl
1 #!/usr/bin/perl -w
2 use strict;
3 use Text::Wrap;
4 $Text::Wrap::columns = 80;
5 my ($committer, $patch, $log);
6 use Getopt::Long;
7
8 my ($rank, $percentage, $cumulative, $reverse, $ta, @authors, %authors,
9     %untraced, %patchers, %committers);
10 my $result = GetOptions ("rank" => \$rank,                  # rank authors
11                          "thanks-applied" => \$ta,          # ranks committers
12                          "acknowledged=s"   => \@authors ,  # authors files
13                          "percentage" => \$percentage,      # show as %age
14                          "cumulative" => \$cumulative,
15                          "reverse" => \$reverse,
16                         );
17
18 if (!$result or (($rank||0) + ($ta||0) + (@authors ? 1 : 0) != 1) or !@ARGV) {
19   die <<"EOS";
20 $0 --rank Changelogs                        # rank authors by patches
21 $0 --acknowledged <authors file> Changelogs # Display unacknowledged authors
22 $0 --thanks-applied Changelogs              # ranks committers
23 $0 --percentage ...                         # show rankings as percentages
24 $0 --cumulative ...                         # show rankings cumulatively
25 $0 --reverse ...                            # show rankings in reverse
26 Specify stdin as - if needs be. Remember that option names can be abbreviated.
27 EOS
28 }
29
30
31 my $prev = "";
32 my %map;
33
34 while (<DATA>) {
35     chomp;
36     s/\\100/\@/g;
37     $_ = lc;
38     if (my ($correct, $alias) = /^\s*([^#\s]\S*)\s+(.*\S)/) {
39         if ($correct eq '+') {$correct = $prev} else {$prev = $correct}
40         $map {$alias} = $correct;
41     }
42 }
43
44 #
45 # Email addresses for we do not have names.
46 #
47 $map {$_} = "?" for 
48     "agrow\100thegotonerd.com",
49     "alexander_bluhm\100genua.de",
50     "alexander_gernler\100genua.de",
51     "ammon\100rhythm.com",
52     "bah\100longitude.com",
53     "bbucklan\100jpl-devvax.jpl.nasa.gov",
54     "ben\100linuxgazette.net",
55     "bilbo\100ua.fm",
56     "bob\100starlabs.net",
57     "bonefish\100cs.tu-berlin.de",
58     "bstrand\100switchmanagement.com",
59     "cygwin\100cygwin.com",
60     "david\100dhaller.de",
61     "dformosa\100dformosa.zeta.org.au",
62     "dgay\100acm.org",
63     "erik\100cs.uni-jena.de",
64     "glasser\100tang-eleven-seventy-nine.mit.edu",
65     "gml4410\100ggr.co.uk",
66     "grommel\100sears.com",
67     "ilya\100juil.nonet",
68     "info\100lingo.kiev.ua",
69     "jms\100mathras.comcast.net",
70     "johnh\100isi.edu",
71     "kan\100dcit.cz",
72     "kaminsky\100math.huji.ac.il",
73     "knew-p5p\100pimb.org",
74     "kvr\100centrum.cz",
75     "lemkemch\100t-online.de",
76     "mauzo\100csv.warwick.ac.uk",
77     "merijnb\100ms.com",
78     "mlelstv\100serpens.de",
79     "p.boven\100sara.nl",
80     "padre\100elte.hu",
81     "perlbug\100veggiechinese.net",
82     "pm\100capmon.dk",
83     "premchai21\100yahoo.com",
84     "pxm\100nubz.org",
85     "raf\100tradingpost.com.au",
86     "scott\100perlcode.org",
87     "smoketst\100hp46t243.cup.hp.com",
88     "yath-perlbug\100yath.de",
89 ;
90
91 #
92 # Email addresses for people that don't have an email address in AUTHORS
93 # Presumably deliberately?
94
95
96 $map {$_} = '!' for
97      # Nick Ing-Simmons has passed away (2006-09-25).
98      "nick\100ing-simmons.net",
99      "nik\100tiuk.ti.com",
100      "nick.ing-simmons\100elixent.com",
101
102      # Iain Truskett has passed away (2003-12-29).
103      "perl\100dellah.anu.edu.au",
104      "spoon\100dellah.org",
105      "spoon\100cpan.org",
106
107      # Ton Hospel
108      "me-02\100ton.iguana.be",
109      "perl-5.8.0\100ton.iguana.be",
110      "perl5-porters\100ton.iguana.be",
111
112      # Beau Cox
113      "beau\100beaucox.com",
114
115      # Randy W. Sims 
116      "ml-perl\100thepierianspring.org",
117
118      # Yuval Kogman
119      "nothingmuch\100woobling.org",
120
121 ;
122
123
124 if (@authors) {
125   my %raw;
126   foreach my $filename (@authors) {
127     open FH, "<$filename" or die "Can't open $filename: $!";
128     while (<FH>) {
129       next if /^\#/;
130       next if /^-- /;
131       if (/<([^>]+)>/) {
132         # Easy line.
133         $raw{$1}++;
134       } elsif (/^([-A-Za-z0-9 .\'À-ÖØöø-ÿ]+)[\t\n]/) {
135         # Name only
136         $untraced{$1}++;
137       } else {
138         chomp;
139         warn "Can't parse line '$_'";
140       }
141     }
142   }
143   foreach (keys %raw) {
144     print "E-mail $_ occurs $raw{$_} times\n" if $raw{$_} > 1;
145     $_ = lc $_;
146     $authors{$map{$_} || $_}++;
147   }
148   ++$authors{'!'};
149   ++$authors{'?'};
150 }
151
152 while (<>) {
153   next if /^-+/;
154   if (m!^\[\s+(\d+)\]\s+By:\s+(\S+)\s+on!) {
155     # new patch
156     my @new = ($1, $2);
157     &process ($committer, $patch, $log);
158     ($patch, $committer) = @new;
159     undef $log;
160   } elsif (s/^(\s+Log: )//) {
161     die "Duplicate Log:" if $log;
162     $log = $_;
163     my $prefix = " " x length $1;
164     LOG: while (<>) {
165       next if /^$/;
166       s/^\t/        /;
167       if (s/^$prefix//) {
168         $log .= $_;
169       } elsif (/^\s+Branch:/) {
170         last LOG;
171       } else {
172         chomp;
173         die "Malformed log end with '$_'";
174       }
175     }
176   }
177 }
178
179 &process ($committer, $patch, $log);
180
181 if ($rank) {
182   &display_ordered(\%patchers);
183 } elsif ($ta) {
184   &display_ordered(\%committers);
185 } elsif (%authors) {
186   my %missing;
187   foreach (sort keys %patchers) {
188     next if $authors{$_};
189     # Sort by number of patches, then name.
190     $missing{$patchers{$_}}->{$_}++;
191   }
192   foreach my $patches (sort {$b <=> $a} keys %missing) {
193     print "$patches patch(es)\n";
194     foreach my $author (sort keys %{$missing{$patches}}) {
195       print "  $author\n";
196     }
197   }
198 }
199
200 sub display_ordered {
201   my $what = shift;
202   my @sorted;
203   my $total;
204   while (my ($name, $count) = each %$what) {
205     push @{$sorted[$count]}, $name;
206     $total += $count;
207   }
208
209   my $i = @sorted;
210   return unless @sorted;
211   my $sum = 0;
212   foreach my $i ($reverse ? 0 .. $#sorted : reverse 0 .. $#sorted) {
213     next unless $sorted[$i];
214     my $prefix;
215     $sum += $i * @{$sorted[$i]};
216     # Value to display is either this one, or the cumulative sum.
217     my $value = $cumulative ? $sum : $i;
218     if ($percentage) {
219         $prefix = sprintf "%6.2f:\t", 100 * $value / $total;
220     } else {
221         $prefix = "$value:\t";
222     }
223     print wrap ($prefix, "\t", join (" ", sort @{$sorted[$i]}), "\n");
224   }
225 }
226
227 sub process {
228   my ($committer, $patch, $log) = @_;
229   return unless $committer;
230   my @authors = $log =~ /From:\s+.*?([^"\@ \t\n<>]+\@[^"\@ \t\n<>]+)/gm;
231
232   if (@authors) {
233     foreach (@authors) {
234       s/^<//;
235       s/>$//;
236       $_ = lc $_;
237       $patchers{$map{$_} || $_}++;
238     }
239     # print "$patch: @authors\n";
240     ++$committers{$committer};
241   } else {
242     # print "$patch: $committer\n";
243     # Not entirely fair as this means that the maint pumpking scores for
244     # everything intergrated that wasn't a third party patch in blead
245     $patchers{$committer}++;
246   }
247 }
248
249
250 __DATA__
251
252 #
253 # List of mappings. First entry the "correct" email address, as appears
254 # in the AUTHORS file. Second is any "alias" mapped to it.
255 #
256 # If the "correct" email address is a '+', the entry above is reused; 
257 # this for addresses with more than one alias.
258 #
259 # Note that all entries are in lowercase. Further, no '@' signs should
260 # appear; use \100 instead.
261 #
262 #
263 #  Committers.
264 #
265 adi                                     enache\100rdslink.ro
266 alanbur                                 alan.burlison\100sun.com
267 +                                       alan.burlison\100uk.sun.com
268 ams                                     ams\100wiw.org
269 chip                                    chip\100pobox.com
270 craigb                                  craig.berry\100psinetcs.com
271 +                                       craig.berry\100metamorgs.com
272 +                                       craig.berry\100signaltreesolutions.com
273 +                                       craigberry\100mac.com
274 +                                       craig.a.berry\100gmail.com
275 davem                                   davem\100fdgroup.com
276 +                                       davem\100iabyn.nospamdeletethisbit.com
277 +                                       davem\100iabyn.com
278 +                                       davem\100fdgroup.co.uk
279 +                                       davem\100fdisolutions.com
280 +                                       davem\100iabyn.com
281 demerphq                                demerphq\100gmail.com
282 +                                       yves.orton\100de.mci.com
283 +                                       yves.orton\100mciworldcom.de
284 doughera                                doughera\100lafayette.edu
285 gbarr                                   gbarr\100pobox.com
286 gisle                                   gisle\100activestate.com
287 +                                       gisle\100aas.no
288 gsar                                    gsar\100activestate.com
289 +                                       gsar\100cpan.org
290 hv                                      hv\100crypt.compulink.co.uk
291 +                                       hv\100crypt.org
292 jhi                                     jhi\100iki.fi
293 +                                       jhietaniemi\100gmail.com
294 +                                       jhi\100kosh.hut.fi
295 +                                       jhi\100cc.hut.fi
296 +                                       jarkko.hietaniemi\100nokia.com
297 merijn                                  h.m.brand\100xs4all.nl
298 +                                       h.m.brand\100hccnet.nl
299 +                                       merijn\100l1.procura.nl
300 mhx                                     mhx-perl\100gmx.net
301 nicholas                                nick\100unfortu.net
302 +                                       nick\100ccl4.org
303 +                                       nick\100talking.bollo.cx
304 +                                       nick\100plum.flirble.org
305 +                                       nick\100babyhippo.co.uk
306 +                                       nick\100bagpuss.unfortu.net
307 pudge                                   pudge\100pobox.com
308 rgs                                     rgarciasuarez\100free.fr
309 +                                       rgarciasuarez\100mandrakesoft.com
310 +                                       rgarciasuarez\100mandriva.com
311 +                                       rgarciasuarez\100gmail.com
312 +                                       raphel.garcia-suarez\100hexaflux.com
313 sky                                     sky\100nanisky.com
314 +                                       artur\100contiller.se
315 +                                       arthur\100contiller.se
316 steveh                                  stevehay\100planit.com
317 +                                       steve.hay\100uk.radan.com
318 stevep                                  steve\100fisharerojo.org
319 +                                       steve.peters\100gmail.com
320
321 #
322 # Mere mortals.
323 #
324 7k8lrvf02\100sneakemail.com             kjx9zthh3001\100sneakemail.com
325 +                                       dtr8sin02\100sneakemail.com
326 +                                       rt8363b02\100sneakemail.com
327 +                                       o6hhmk002\100sneakemail.com
328 +                                       smueller\100cpan.org
329 +                                       l2ot9pa02\100sneakemail.com
330 +                                       wyp3rlx02\100sneakemail.com
331
332 abe\100ztreet.demon.nl                  abeltje\100cpan.org
333 abigail\100abigail.be                   abigail\100foad.org
334 +                                       abigail\100abigail.nl
335 ajohnson\100nvidia.com                  ajohnson\100wischip.com
336 alexm\100netli.com                      alexm\100w-m.ru
337 alex-p5p\100earth.li                    alex\100rcon.rog
338 alian\100cpan.org                       alian\100alianwebserver.com
339 allens\100cpan.org                      easmith\100beatrice.rutgers.edu
340 andreas.koenig\100anima.de        andreas.koenig.gmwojprw\100franz.ak.mind.de
341 +                                 andreas.koenig.7os6vvqr\100franz.ak.mind.de
342 +                                       a.koenig\100mind.de
343 anno4000\100lublin.zrz.tu-berlin.de     anno4000\100mailbox.tu-berlin.de
344 +                                       siegel\100zrz.tu-berlin.de
345 ash\100cpan.org                         ash_cpan\100firemirror.com
346 avarab\100gmail.com                     avar\100cpan.org
347
348 bah\100ecnvantage.com                   bholzman\100longitude.com
349 bcarter@gumdrop.flyinganvil.org         q.eibcartereio.=~m-b.{6}-cgimosx@gumdrop.flyinganvil.org
350 ben_tilly\100operamail.com              btilly\100gmail.com
351
352 chromatic\100wgz.org                    chromatic\100rmci.net
353 clkao\100clkao.org                      clkao\100bestpractical.com
354 cp\100onsitetech.com                    publiustemp-p5p\100yahoo.com
355 +                                       publiustemp-p5p3\100yahoo.com
356 cpan\100audreyt.org                     autrijus\100egb.elixus.org
357 +                                       autrijus\100geb.elixus.org
358 +                                       autrijus\100gmail.com
359 +                                       autrijus\100ossf.iis.sinica.edu.tw
360 +                                       autrijus\100autrijus.org
361 +                                       audreyt\100audreyt.org
362
363 damian\100cs.monash.edu.au              damian\100conway.org
364 david.dyck\100fluke.com                 dcd\100tc.fluke.com
365 demerphq\100gmail.com                   demerphq\100hotmail.com
366 domo\100computer.org                    shouldbedomo\100mac.com
367
368 epeschko\100den-mdev1                   esp5\100pge.com
369
370 fugazi\100zyx.net                       larrysh\100cpan.org
371
372 gellyfish\100gellyfish.com              jns\100gellyfish.com
373 gp\100familiehaase.de                   gerrit\100familiehaase.de
374 grazz\100pobox.com                      grazz\100nyc.rr.com
375
376 hio\100ymir.co.jp                       hio\100hio.jp
377
378 japhy\100pobox.com                      japhy\100pobox.org
379 +                                       japhy\100perlmonk.org
380 +                                       japhy\100cpan.org
381 jari.aalto\100poboxes.com               jari.aalto\100cante.net
382 jcromie\100divsol.com                   jcromie\100cpan.org
383 +                                       jim.cromie\100gmail.com
384 jdhedden\100cpan.org                    jerry\100hedden.us
385 +                                       jdhedden\1001979.usna.com
386 +                                       jdhedden\100gmail.com
387 +                                       jdhedden\100yahoo.com
388 jfriedl\100yahoo.com                    jfriedl\100yahoo-inc.com
389 jjore\100cpan.org                       twists\100gmail.com
390 juerd\100cpan.org                       juerd\100convolution.nl
391
392 kane\100dwim.org                        kane\100xs4all.net
393 +                                       kane\100cpan.org
394 +                                       kane\100xs4all.nl
395 +                                       jos\100dwim.org
396 +                                       jib\100ripe.net
397 kroepke\100dolphin-services.de          kay\100dolphin-services.de
398 kstar\100wolfetech.com                  kstar\100cpan.org
399
400 mats\100sm6sxl.net                      mats\100sm5sxl.net
401 mbarbon\100dsi.unive.it                 mattia.barbon\100libero.it
402 mcmahon\100ibiblio.org                  mcmahon\100metalab.unc.edu
403 merijnb\100iloquent.nl                  merijnb\100iloquent.com
404 mgjv\100comdyn.com.au                   mgjv\100tradingpost.com.au
405 michael.schroeder\100informatik.uni-erlangen.de mls\100suse.de
406 mike\100stok.co.uk                      mike\100exegenix.com
407 mjtg\100cam.ac.uk                       mjtg\100cus.cam.ac.uk
408
409 nospam-abuse\100bloodgate.com           tels\100bloodgate.com
410 +                                       perl_dummy\100bloodgate.com
411 ilya\100math.berkeley.edu               ilya\100math.ohio-state.edu
412 +                                       nospam-abuse\100ilyaz.org
413
414 p5-authors\100crystalflame.net          perl\100crystalflame.net
415 +                                       rs\100crystalflame.net
416 paul.green\100stratus.com               paul_greenvos\100vos.stratus.com
417 paul.marquess\100btinternet.com         paul_marquess\100yahoo.co.uk
418 +                                       paul.marquess\100ntlworld.com
419 +                                       paul.marquess\100openwave.com
420 pcg\100goof.com                         schmorp\100schmorp.de
421 # Maybe we should special case this to get real names out?
422 perlbug\100perl.org                     perlbug-followup\100perl.org
423 +                                       bugs-perl5\100bugs6.perl.org
424 phil\100perkpartners.com                phil\100finchcomputer.com
425 pimlott\100idiomtech.com                andrew\100pimlott.net
426 pne\100cpan.org                         philip.newton\100gmx.net
427 +                                       philip.newton\100datenrevision.de
428 +                                       pnewton\100gmx.de
429
430 radu\100netsoft.ro                      rgreab\100fx.ro
431 richard.foley\100ubsw.com               richard.foley\100t-online.de
432 +                                       richard.foley\100ubs.com
433 +                                       richard.foley\100rfi.net
434 rick\100consumercontact.com             rick\100bort.ca
435 +                                       rick.delaney\100rogers.com
436 +                                       rick\100bort.ca
437 rjbs\100cpan.org                        rjbs-perl-p5p\100lists.manxome.org
438 rjk\100linguist.dartmouth.edu           rjk\100linguist.thayer.dartmouth.edu
439 +                                       rjk-perl-p5p\100tamias.net
440 rmgiroux\100acm.org                     rmgiroux\100hotmail.com
441 rmbarker\100cpan.org                    rmb1\100cise.npl.co.uk
442 +                                       robin.barker\100npl.co.uk
443 rootbeer\100teleport.com                rootbeer\100redcat.com
444
445 schubiger\100cpan.org                   steven\100accognoscere.org
446 +                                       sts\100accognoscere.org
447 schwern\100pobox.com                    schwern\100gmail.com
448 +                                       schwern\100athens.arena-i.com
449 +                                       schwern\100blackrider.aocn.com
450 +                                       schwern\100ool-18b93024.dyn.optonline.net
451 sebastien\100aperghis.net               maddingue\100free.fr
452 +                                       saper\100cpan.org
453 simon\100simon-cozens.org               simon\100pembro4.pmb.ox.ac.uk
454 +                                       simon\100brecon.co.uk
455 +                                       simon\100othersideofthe.earth.li
456 +                                       simon\100cozens.net
457 +                                       simon\100netthink.co.uk
458 slaven\100rezic.de                      slaven.rezic\100berlin.de
459 +                                       srezic\100iconmobile.com
460 smcc\100mit.edu                         smcc\100ocf.berkeley.edu
461 +                                       smcc\100csua.berkeley.edu
462 spider\100orb.nashua.nh.us              spider\100web.zk3.dec.com
463 +                                       spider\100leggy.zk3.dec.com
464 +                                       spider-perl\100orb.nashua.nh.us
465 +                                       spider\100peano.zk3.dec.com
466 stef\100mongueurs.net                   stef\100payrard.net
467 +                                       s.payrard\100wanadoo.fr
468
469 tassilo.parseval\100post.rwth-aachen.de tassilo.von.parseval\100rwth-aachen.de
470 thomas.dorner\100start.de               tdorner\100amadeus.net
471 tjenness\100cpan.org                    t.jenness\100jach.hawaii.edu
472 +                                       timj\100jach.hawaii.edu
473 tom.horsley\100mail.ccur.com            tom.horsley\100ccur.com
474
475 vkonovalov\100lucent.com                vkonovalov\100peterstar.ru
476 +                                       konovalo\100mail.wplus.net
477 +                                       vadim\100vkonovalov.ru
478 +                                       vkonovalov\100spb.lucent.com
479 +                                       vkonovalov\100alcatel-lucent.com
480
481 whatever\100davidnicol.com              davidnicol\100gmail.com
482 wolfgang.laun\100alcatel.at             wolfgang.laun\100chello.at
483 +                                       wolfgang.laun\100thalesgroup.com
484 +                                       wolfgang.laun\100gmail.com