X-Git-Url: http://git.shadowcat.co.uk/gitweb/gitweb.cgi?a=blobdiff_plain;f=lib%2FUnicode%2FUCD.pm;h=96dee9a8164c03ecfbc0b8f3b4c98b2e9f36ab80;hb=cd340a5d1de2dbc931e802b4aaed98e9e4d75f51;hp=ff9cc8fc05ad3ad35ffe2dad465ca7d93b2c48d3;hpb=d1be9408a3c14848d30728674452e191ba5fffaa;p=p5sagit%2Fp5-mst-13.2.git diff --git a/lib/Unicode/UCD.pm b/lib/Unicode/UCD.pm index ff9cc8f..96dee9a 100644 --- a/lib/Unicode/UCD.pm +++ b/lib/Unicode/UCD.pm @@ -108,7 +108,7 @@ as defined by the Unicode standard: title titlecase equivalent mapping block block the character belongs to (used in \p{In...}) - script script the character belongs to + script script the character belongs to If no match is found, a reference to an empty hash is returned. @@ -204,7 +204,7 @@ sub charinfo { last; } } - openunicode(\$UNICODEFH, "Unicode.txt"); + openunicode(\$UNICODEFH, "UnicodeData.txt"); if (defined $UNICODEFH) { use Search::Dict 1.02; if (look($UNICODEFH, "$hexk;", { xfrm => sub { $_[0] =~ /^([^;]+);(.+)/; sprintf "%06X;$2", hex($1) } } ) >= 0) { @@ -280,13 +280,12 @@ positions within all blocks are defined. See also L. -If supplied with an argument that can't be a code point, charblock() -tries to do the opposite and interpret the argument as a character -block. The return value is a I: an anonymous list that -contains anonymous lists, which in turn contain I, -I code point pairs. You can test whether a code point -is in a range using the L function. If the argument is -not a known charater block, C is returned. +If supplied with an argument that can't be a code point, charblock() tries +to do the opposite and interpret the argument as a character block. The +return value is a I: an anonymous list of lists that contain +I, I code point pairs. You can test whether a +code point is in a range using the L function. If the +argument is not a known charater block, C is returned. =cut @@ -342,13 +341,12 @@ character belongs to, e.g. C, C, C. See also L. -If supplied with an argument that can't be a code point, charscript() -tries to do the opposite and interpret the argument as a character -script. The return value is a I: an anonymous list that -contains anonymous lists, which in turn contain I, -I code point pairs. You can test whether a code point -is in a range using the L function. If the argument is -not a known charater script, C is returned. +If supplied with an argument that can't be a code point, charscript() tries +to do the opposite and interpret the argument as a character script. The +return value is a I: an anonymous list of lists that contain +I, I code point pairs. You can test whether a +code point is in a range using the L function. If the +argument is not a known charater script, C is returned. =cut @@ -433,13 +431,13 @@ sub charscripts { The difference between a block and a script is that scripts are closer to the linguistic notion of a set of characters required to present languages, while block is more of an artifact of the Unicode character -numbering and separation into blocks of 256 characters. +numbering and separation into blocks of (mostly) 256 characters. For example the Latin B