From: tla
Date: Tue, 13 Aug 2013 11:38:17 +0000 (+0200)
Subject: Get rid of 'sic' notation in readings
X-Git-Url: http://git.shadowcat.co.uk/gitweb/gitweb.cgi?a=commitdiff_plain;h=b2edc51f76a3f6aac591cfa9533d9fab61c20480;p=scpubgit%2Fstemmatology.git

Get rid of 'sic' notation in readings
---

diff --git a/base/lib/Text/Tradition/Parser/CTE.pm b/base/lib/Text/Tradition/Parser/CTE.pm
index 6180821..2926a4a 100644
--- a/base/lib/Text/Tradition/Parser/CTE.pm
+++ b/base/lib/Text/Tradition/Parser/CTE.pm
@@ -363,7 +363,7 @@ sub interpret {
  # $lemma =~ s/\s+[[:punct:]]+$//;
  my $flag; # In case of p.c. indications
  my @words = split( /\s+/, $lemma );
- $reading =~ s/[[:punct:]]?\bsic\b[[:punct:]]?//g;
+ $reading =~ s/[[:punct:]]?\bsic\b([[:punct:]]+)?//g;
  if( $reading =~ /^(.*) praem.$/ ) {
  $reading = "$1 $lemma";
  } elsif( $reading =~ /^(.*) add.$/ ) {
@@ -395,9 +395,6 @@ sub interpret {
  # There was nothing before a correction.
  $reading = '';
  $flag = '_ac';
- } elsif( $reading =~ /^(.*?)\s*\(?sic([\s\w!.]+)?\)?$/ ) {
- # Discard any 'sic' notation; indeed, indeed.
- $reading = $1;
  } elsif( $reading =~ /^(.*) \.\.\. (.*)$/ ) {
  # The first and last N words captured should replace the first and
  # last N words of the lemma.