Commit | Line | Data |
8e30e889 |
1 | <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"> |
2 | <html xmlns="http://www.w3.org/1999/xhtml"> |
3 | <!-- |
4 | This file was generated by Devel::NYTProf version 4.06 |
5 | --> |
6 | <head> |
7 | <meta http-equiv="Content-Type" content="text/html; charset=utf-8" /> |
8 | <meta http-equiv="Content-Language" content="en-us" /> |
9 | <title>Profile of Text/TEI/Markup.pm</title> |
10 | <link rel="stylesheet" type="text/css" href="style.css" /> |
11 | <script type="text/javascript" src="js/jquery-min.js"></script> |
12 | |
13 | <script type="text/javascript" src="js/jquery-tablesorter-min.js"></script> |
14 | <link rel="stylesheet" type="text/css" href="js/style-tablesorter.css" /> |
15 | <script type="text/javascript"> |
16 | // when a column is first clicked on to sort it, use descending order |
17 | // XXX doesn't seem to work (and not just because the tablesorter formatSortingOrder() is broken) |
18 | $.tablesorter.defaults.sortInitialOrder = "desc"; |
19 | // add parser through the tablesorter addParser method |
20 | $.tablesorter.addParser({ |
21 | id: 'fmt_time', // name of this parser |
22 | is: function(s) { |
23 | return false; // return false so this parser is not auto detected |
24 | }, |
25 | format: function(orig) { // format data for normalization |
26 | // console.log(orig); |
27 | val = orig.replace(/ns/,''); |
28 | if (val != orig) { return val / (1000*1000*1000); } |
29 | val = orig.replace(/µs/,''); /* XXX use µ ? */ |
30 | if (val != orig) { return val / (1000*1000); } |
31 | var val = orig.replace(/ms/,''); |
32 | if (val != orig) { return val / (1000); } |
33 | var val = orig.replace(/s/,''); |
34 | if (val != orig) { return val; } |
35 | if (orig == '0') { return orig; } |
36 | console.log('no match for fmt_time of '.concat(orig)); |
37 | return orig; |
38 | }, |
39 | type: 'numeric' // set type, either numeric or text |
40 | }); |
41 | </script> |
42 | </head> |
43 | |
44 | <body > |
45 | <div class="header" style="position: relative; overflow-x: hidden; overflow-y: hidden; z-index: 0; "> |
46 | <div class="header_back"> |
47 | <a href="index.html">← Index</a> |
48 | </div> |
49 | <div class="headerForeground" style="float: left"> |
50 | <span class="siteTitle">NYTProf Performance Profile</span> |
51 | <span class="siteSubtitle">  <span>« <span class="mode_btn"><a href="Text-TEI-Markup-pm-1183-block.html">block view</a></span> • <span class="mode_btn mode_btn_selected">line view</span> • <span class="mode_btn"><a href="Text-TEI-Markup-pm-1183-sub.html">sub view</a></span> »</span><br /> |
52 | For script/nytprof.pl |
53 | </span> |
54 | </div> |
55 | <div class="headerForeground" style="float: right; text-align: right"> |
56 | <span class="siteTitle"> </span> |
57 | <span class="siteSubtitle">Run on Thu May 31 16:29:39 2012<br />Reported on Thu May 31 16:40:08 2012</span> |
58 | </div> |
59 | <div style="position: absolute; left: 0px; top: 0%; width: 100%; height: 101%; z-index: -1; background-color: rgb(17, 136, 255); "></div> |
60 | <div style="position: absolute; left: 0px; top: 2%; width: 100%; height: 99%; z-index: -1; background-color: rgb(16, 134, 253); "></div> |
61 | <div style="position: absolute; left: 0px; top: 4%; width: 100%; height: 97%; z-index: -1; background-color: rgb(16, 133, 252); "></div> |
62 | <div style="position: absolute; left: 0px; top: 6%; width: 100%; height: 95%; z-index: -1; background-color: rgb(15, 131, 250); "></div> |
63 | <div style="position: absolute; left: 0px; top: 8%; width: 100%; height: 93%; z-index: -1; background-color: rgb(15, 130, 249); "></div> |
64 | <div style="position: absolute; left: 0px; top: 10%; width: 100%; height: 91%; z-index: -1; background-color: rgb(15, 129, 248); "></div> |
65 | <div style="position: absolute; left: 0px; top: 12%; width: 100%; height: 89%; z-index: -1; background-color: rgb(14, 127, 246); "></div> |
66 | <div style="position: absolute; left: 0px; top: 14%; width: 100%; height: 87%; z-index: -1; background-color: rgb(14, 126, 245); "></div> |
67 | <div style="position: absolute; left: 0px; top: 16%; width: 100%; height: 85%; z-index: -1; background-color: rgb(14, 125, 244); "></div> |
68 | <div style="position: absolute; left: 0px; top: 18%; width: 100%; height: 83%; z-index: -1; background-color: rgb(13, 123, 242); "></div> |
69 | <div style="position: absolute; left: 0px; top: 20%; width: 100%; height: 81%; z-index: -1; background-color: rgb(13, 122, 241); "></div> |
70 | <div style="position: absolute; left: 0px; top: 22%; width: 100%; height: 79%; z-index: -1; background-color: rgb(13, 121, 240); "></div> |
71 | <div style="position: absolute; left: 0px; top: 24%; width: 100%; height: 77%; z-index: -1; background-color: rgb(12, 119, 238); "></div> |
72 | <div style="position: absolute; left: 0px; top: 26%; width: 100%; height: 75%; z-index: -1; background-color: rgb(12, 118, 237); "></div> |
73 | <div style="position: absolute; left: 0px; top: 28%; width: 100%; height: 73%; z-index: -1; background-color: rgb(12, 116, 235); "></div> |
74 | <div style="position: absolute; left: 0px; top: 30%; width: 100%; height: 71%; z-index: -1; background-color: rgb(11, 115, 234); "></div> |
75 | <div style="position: absolute; left: 0px; top: 32%; width: 100%; height: 69%; z-index: -1; background-color: rgb(11, 114, 233); "></div> |
76 | <div style="position: absolute; left: 0px; top: 34%; width: 100%; height: 67%; z-index: -1; background-color: rgb(11, 112, 231); "></div> |
77 | <div style="position: absolute; left: 0px; top: 36%; width: 100%; height: 65%; z-index: -1; background-color: rgb(10, 111, 230); "></div> |
78 | <div style="position: absolute; left: 0px; top: 38%; width: 100%; height: 63%; z-index: -1; background-color: rgb(10, 110, 229); "></div> |
79 | <div style="position: absolute; left: 0px; top: 40%; width: 100%; height: 61%; z-index: -1; background-color: rgb(10, 108, 227); "></div> |
80 | <div style="position: absolute; left: 0px; top: 42%; width: 100%; height: 59%; z-index: -1; background-color: rgb(9, 107, 226); "></div> |
81 | <div style="position: absolute; left: 0px; top: 44%; width: 100%; height: 57%; z-index: -1; background-color: rgb(9, 106, 225); "></div> |
82 | <div style="position: absolute; left: 0px; top: 46%; width: 100%; height: 55%; z-index: -1; background-color: rgb(9, 104, 223); "></div> |
83 | <div style="position: absolute; left: 0px; top: 48%; width: 100%; height: 53%; z-index: -1; background-color: rgb(8, 103, 222); "></div> |
84 | <div style="position: absolute; left: 0px; top: 50%; width: 100%; height: 51%; z-index: -1; background-color: rgb(8, 102, 221); "></div> |
85 | <div style="position: absolute; left: 0px; top: 52%; width: 100%; height: 49%; z-index: -1; background-color: rgb(8, 100, 219); "></div> |
86 | <div style="position: absolute; left: 0px; top: 54%; width: 100%; height: 47%; z-index: -1; background-color: rgb(7, 99, 218); "></div> |
87 | <div style="position: absolute; left: 0px; top: 56%; width: 100%; height: 45%; z-index: -1; background-color: rgb(7, 97, 216); "></div> |
88 | <div style="position: absolute; left: 0px; top: 58%; width: 100%; height: 43%; z-index: -1; background-color: rgb(7, 96, 215); "></div> |
89 | <div style="position: absolute; left: 0px; top: 60%; width: 100%; height: 41%; z-index: -1; background-color: rgb(6, 95, 214); "></div> |
90 | <div style="position: absolute; left: 0px; top: 62%; width: 100%; height: 39%; z-index: -1; background-color: rgb(6, 93, 212); "></div> |
91 | <div style="position: absolute; left: 0px; top: 64%; width: 100%; height: 37%; z-index: -1; background-color: rgb(6, 92, 211); "></div> |
92 | <div style="position: absolute; left: 0px; top: 66%; width: 100%; height: 35%; z-index: -1; background-color: rgb(5, 91, 210); "></div> |
93 | <div style="position: absolute; left: 0px; top: 68%; width: 100%; height: 33%; z-index: -1; background-color: rgb(5, 89, 208); "></div> |
94 | <div style="position: absolute; left: 0px; top: 70%; width: 100%; height: 31%; z-index: -1; background-color: rgb(5, 88, 207); "></div> |
95 | <div style="position: absolute; left: 0px; top: 72%; width: 100%; height: 29%; z-index: -1; background-color: rgb(4, 87, 206); "></div> |
96 | <div style="position: absolute; left: 0px; top: 74%; width: 100%; height: 27%; z-index: -1; background-color: rgb(4, 85, 204); "></div> |
97 | <div style="position: absolute; left: 0px; top: 76%; width: 100%; height: 25%; z-index: -1; background-color: rgb(4, 84, 203); "></div> |
98 | <div style="position: absolute; left: 0px; top: 78%; width: 100%; height: 23%; z-index: -1; background-color: rgb(3, 82, 201); "></div> |
99 | <div style="position: absolute; left: 0px; top: 80%; width: 100%; height: 21%; z-index: -1; background-color: rgb(3, 81, 200); "></div> |
100 | <div style="position: absolute; left: 0px; top: 82%; width: 100%; height: 19%; z-index: -1; background-color: rgb(3, 80, 199); "></div> |
101 | <div style="position: absolute; left: 0px; top: 84%; width: 100%; height: 17%; z-index: -1; background-color: rgb(2, 78, 197); "></div> |
102 | <div style="position: absolute; left: 0px; top: 86%; width: 100%; height: 15%; z-index: -1; background-color: rgb(2, 77, 196); "></div> |
103 | <div style="position: absolute; left: 0px; top: 88%; width: 100%; height: 13%; z-index: -1; background-color: rgb(2, 76, 195); "></div> |
104 | <div style="position: absolute; left: 0px; top: 90%; width: 100%; height: 11%; z-index: -1; background-color: rgb(1, 74, 193); "></div> |
105 | <div style="position: absolute; left: 0px; top: 92%; width: 100%; height: 9%; z-index: -1; background-color: rgb(1, 73, 192); "></div> |
106 | <div style="position: absolute; left: 0px; top: 94%; width: 100%; height: 7%; z-index: -1; background-color: rgb(1, 72, 191); "></div> |
107 | <div style="position: absolute; left: 0px; top: 96%; width: 100%; height: 5%; z-index: -1; background-color: rgb(0, 70, 189); "></div> |
108 | <div style="position: absolute; left: 0px; top: 98%; width: 100%; height: 3%; z-index: -1; background-color: rgb(0, 69, 188); "></div> |
109 | <div style="position: absolute; left: 0px; top: 100%; width: 100%; height: 1%; z-index: -1; background-color: rgb(0, 68, 187); "></div> |
110 | </div> |
111 | |
112 | <div class="body_content"><br /> |
113 | <table class="file_summary"><tr><td class="h">Filename</td><td align="left"><a href="file:///Users/edenc/perl5/lib/perl5/Text/TEI/Markup.pm">/Users/edenc/perl5/lib/perl5/Text/TEI/Markup.pm</a></td></tr> |
114 | <tr><td class="h">Statements</td><td align="left">Executed 17 statements in 2.31ms</td></tr></table> |
115 | |
116 | <table id="subs_table" border="1" cellpadding="0" class="tablesorter"> |
117 | <caption>Subroutines</caption> <!-- one row per subroutine; the hidden span in the last column repeats the fully qualified name (presumably as the sort key; confirm against the tablesorter setup) --> |
118 | <thead> |
119 | <tr> |
120 | <th scope="col">Calls</th> |
121 | <th scope="col"><span title="Number of Places sub is called from">P</span></th> |
122 | <th scope="col"><span title="Number of Files sub is called from">F</span></th> |
123 | <th scope="col">Exclusive<br />Time</th> |
124 | <th scope="col">Inclusive<br />Time</th> |
125 | <th scope="col">Subroutine</th> |
126 | </tr> |
127 | </thead> |
128 | <tbody> |
129 | <tr><td class="c3">1</td><td class="c3">1</td><td class="c3">1</td><td class="c0"><span title="0.0%">17µs</span></td><td class="c3"><span title="0.0%">21µs</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::BEGIN@3</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#3">BEGIN@3</a></td></tr> |
130 | <tr><td class="c3">1</td><td class="c3">1</td><td class="c3">1</td><td class="c1"><span title="0.0%">13µs</span></td><td class="c3"><span title="0.0%">27µs</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::BEGIN@433</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#433">BEGIN@433</a></td></tr> |
131 | <tr><td class="c3">1</td><td class="c3">1</td><td class="c3">1</td><td class="c3"><span title="0.0%">11µs</span></td><td class="c0"><span title="0.0%">78µs</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::BEGIN@5</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#5">BEGIN@5</a></td></tr> |
132 | <tr><td class="c3">1</td><td class="c3">1</td><td class="c3">1</td><td class="c3"><span title="0.0%">11µs</span></td><td class="c3"><span title="0.0%">26µs</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::BEGIN@7</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#7">BEGIN@7</a></td></tr> |
133 | <tr><td class="c3">1</td><td class="c3">1</td><td class="c3">1</td><td class="c3"><span title="0.0%">10µs</span></td><td class="c3"><span title="0.0%">16µs</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::BEGIN@6</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#6">BEGIN@6</a></td></tr> |
134 | <tr><td class="c3">1</td><td class="c3">1</td><td class="c3">1</td><td class="c3"><span title="0.0%">9µs</span></td><td class="c0"><span title="0.0%">206µs</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::BEGIN@8</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#8">BEGIN@8</a></td></tr> |
135 | <tr><td class="c3">1</td><td class="c3">1</td><td class="c3">1</td><td class="c3"><span title="0.0%">8µs</span></td><td class="c0"><span title="0.0%">54µs</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::BEGIN@4</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#4">BEGIN@4</a></td></tr> |
136 | <tr><td class="c3">0</td><td class="c3">0</td><td class="c3">0</td><td class="c3"><span title="0.0%">0s</span></td><td class="c3"><span title="0.0%">0s</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::_open_tag</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#441">_open_tag</a></td></tr> |
137 | <tr><td class="c3">0</td><td class="c3">0</td><td class="c3">0</td><td class="c3"><span title="0.0%">0s</span></td><td class="c3"><span title="0.0%">0s</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::_process_line</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#333">_process_line</a></td></tr> |
138 | <tr><td class="c3">0</td><td class="c3">0</td><td class="c3">0</td><td class="c3"><span title="0.0%">0s</span></td><td class="c3"><span title="0.0%">0s</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::_wrap_children</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#525">_wrap_children</a></td></tr> |
139 | <tr><td class="c3">0</td><td class="c3">0</td><td class="c3">0</td><td class="c3"><span title="0.0%">0s</span></td><td class="c3"><span title="0.0%">0s</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::to_xml</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#238">to_xml</a></td></tr> |
140 | <tr><td class="c3">0</td><td class="c3">0</td><td class="c3">0</td><td class="c3"><span title="0.0%">0s</span></td><td class="c3"><span title="0.0%">0s</span></td><td class="sub_name"><span style="display: none;">Text::TEI::Markup::::word_tag_wrap</span>Text::TEI::Markup::<a href="Text-TEI-Markup-pm-1183-line.html#486">word_tag_wrap</a></td></tr> |
141 | </tbody></table> |
142 | Call graph for these subroutines as a |
143 | <a href="http://en.wikipedia.org/wiki/Graphviz">Graphviz</a> |
144 | <a href="Users-edenc-perl5-lib-perl5-Text-TEI-Markup-pm.dot">dot language file</a>. |
145 | |
146 | <table border="1" cellpadding="0"> |
147 | <thead> |
148 | <tr><th>Line</th> |
149 | <th><span title="Number of statements executed">State<br />ments</span></th> |
150 | <th><span title="Time spent executing statements on the line, |
151 | excluding time spent executing statements in any called subroutines">Time<br />on line</span></th> |
152 | <th><span title="Number of subroutine calls">Calls</span></th> |
153 | <th><span title="Time spent in subroutines called (inclusive)">Time<br />in subs</span></th> |
154 | <th class="left_indent_header">Code</th> |
155 | </tr> |
156 | |
157 | </thead> |
158 | <tbody> |
159 | <tr><td class="h"><a name="1"></a>1</td><td></td><td></td><td></td><td></td><td class="s">package Text::TEI::Markup;</td></tr> |
160 | <tr><td class="h"><a name="2"></a>2</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
161 | <tr><td class="h"><a name="3"></a>3</td><td class="c3">2</td><td class="c1"><span title="Avg 17µs">34µs</span></td><td class="c3">2</td><td class="c3">26µs</td><td class="s"><div class="calls"><div class="calls_in"># spent 21µs (17+4) within Text::TEI::Markup::BEGIN@3 which was called: |
162 | # once (17µs+4µs) by Text::Tradition::Witness::BEGIN@7 at <a href="Text-TEI-Markup-pm-1183-line.html#3">line 3</a></div></div>use strict;<div class="calls"><div class="calls_out"># spent 21µs making 1 call to <a href="Text-TEI-Markup-pm-1183-line.html#3">Text::TEI::Markup::BEGIN@3</a> |
163 | # spent 4µs making 1 call to <a href="strict-pm-3-line.html#34">strict::import</a></div></div></td></tr> |
164 | <tr><td class="h"><a name="4"></a>4</td><td class="c3">2</td><td class="c3"><span title="Avg 13µs">25µs</span></td><td class="c3">2</td><td class="c0">100µs</td><td class="s"><div class="calls"><div class="calls_in"># spent 54µs (8+46) within Text::TEI::Markup::BEGIN@4 which was called: |
165 | # once (8µs+46µs) by Text::Tradition::Witness::BEGIN@7 at <a href="Text-TEI-Markup-pm-1183-line.html#4">line 4</a></div></div>use vars qw( $VERSION @EXPORT_OK );<div class="calls"><div class="calls_out"># spent 54µs making 1 call to <a href="Text-TEI-Markup-pm-1183-line.html#4">Text::TEI::Markup::BEGIN@4</a> |
166 | # spent 46µs making 1 call to <a href="vars-pm-6-line.html#10">vars::import</a></div></div></td></tr> |
167 | <tr><td class="h"><a name="5"></a>5</td><td class="c3">2</td><td class="c2"><span title="Avg 15µs">30µs</span></td><td class="c3">2</td><td class="c0">146µs</td><td class="s"><div class="calls"><div class="calls_in"># spent 78µs (11+67) within Text::TEI::Markup::BEGIN@5 which was called: |
168 | # once (11µs+67µs) by Text::Tradition::Witness::BEGIN@7 at <a href="Text-TEI-Markup-pm-1183-line.html#5">line 5</a></div></div>use Encode;<div class="calls"><div class="calls_out"># spent 78µs making 1 call to <a href="Text-TEI-Markup-pm-1183-line.html#5">Text::TEI::Markup::BEGIN@5</a> |
169 | # spent 67µs making 1 call to <a href="Exporter-pm-8-line.html#28">Exporter::import</a></div></div></td></tr> |
170 | <tr><td class="h"><a name="6"></a>6</td><td class="c3">2</td><td class="c3"><span title="Avg 12µs">25µs</span></td><td class="c3">2</td><td class="c3">22µs</td><td class="s"><div class="calls"><div class="calls_in"># spent 16µs (10+6) within Text::TEI::Markup::BEGIN@6 which was called: |
171 | # once (10µs+6µs) by Text::Tradition::Witness::BEGIN@7 at <a href="Text-TEI-Markup-pm-1183-line.html#6">line 6</a></div></div>use Exporter 'import';<div class="calls"><div class="calls_out"># spent 16µs making 1 call to <a href="Text-TEI-Markup-pm-1183-line.html#6">Text::TEI::Markup::BEGIN@6</a> |
172 | # spent 6µs making 1 call to <a href="Exporter-pm-8-line.html#28">Exporter::import</a></div></div></td></tr> |
173 | <tr><td class="h"><a name="7"></a>7</td><td class="c3">2</td><td class="c3"><span title="Avg 12µs">25µs</span></td><td class="c3">2</td><td class="c3">41µs</td><td class="s"><div class="calls"><div class="calls_in"># spent 26µs (11+15) within Text::TEI::Markup::BEGIN@7 which was called: |
174 | # once (11µs+15µs) by Text::Tradition::Witness::BEGIN@7 at <a href="Text-TEI-Markup-pm-1183-line.html#7">line 7</a></div></div>use Scalar::Util;<div class="calls"><div class="calls_out"># spent 26µs making 1 call to <a href="Text-TEI-Markup-pm-1183-line.html#7">Text::TEI::Markup::BEGIN@7</a> |
175 | # spent 15µs making 1 call to <a href="Exporter-pm-8-line.html#28">Exporter::import</a></div></div></td></tr> |
176 | <tr><td class="h"><a name="8"></a>8</td><td class="c3">2</td><td class="c0"><span title="Avg 625µs">1.25ms</span></td><td class="c3">2</td><td class="c0">402µs</td><td class="s"><div class="calls"><div class="calls_in"># spent 206µs (9+197) within Text::TEI::Markup::BEGIN@8 which was called: |
177 | # once (9µs+197µs) by Text::Tradition::Witness::BEGIN@7 at <a href="Text-TEI-Markup-pm-1183-line.html#8">line 8</a></div></div>use XML::LibXML;<div class="calls"><div class="calls_out"># spent 206µs making 1 call to <a href="Text-TEI-Markup-pm-1183-line.html#8">Text::TEI::Markup::BEGIN@8</a> |
178 | # spent 197µs making 1 call to <a href="XML-LibXML-pm-1093-line.html#182">XML::LibXML::import</a></div></div></td></tr> |
179 | <tr><td class="h"><a name="9"></a>9</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
180 | <tr><td class="h"><a name="10"></a>10</td><td class="c3">1</td><td class="c3"><span title="Avg 700ns">700ns</span></td><td></td><td></td><td class="s">$VERSION = '1.7';</td></tr> |
181 | <tr><td class="h"><a name="11"></a>11</td><td class="c3">1</td><td class="c3"><span title="Avg 1µs">1µs</span></td><td></td><td></td><td class="s">@EXPORT_OK = qw( &to_xml &word_tag_wrap );</td></tr> |
182 | <tr><td class="h"><a name="12"></a>12</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
183 | <tr><td class="h"><a name="13"></a>13</td><td></td><td></td><td></td><td></td><td class="s">=head1 NAME</td></tr> |
184 | <tr><td class="h"><a name="14"></a>14</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
185 | <tr><td class="h"><a name="15"></a>15</td><td></td><td></td><td></td><td></td><td class="s">Text::TEI::Markup - a transcription markup syntax for TEI XML</td></tr> |
186 | <tr><td class="h"><a name="16"></a>16</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
187 | <tr><td class="h"><a name="17"></a>17</td><td></td><td></td><td></td><td></td><td class="s">=head1 SYNOPSIS</td></tr> |
188 | <tr><td class="h"><a name="18"></a>18</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
189 | <tr><td class="h"><a name="19"></a>19</td><td></td><td></td><td></td><td></td><td class="s"> use Text::TEI::Markup qw( to_xml );</td></tr> |
190 | <tr><td class="h"><a name="20"></a>20</td><td></td><td></td><td></td><td></td><td class="s"> my $xml_string = to_xml( file => $markup_file, </td></tr> |
191 | <tr><td class="h"><a name="21"></a>21</td><td></td><td></td><td></td><td></td><td class="s"> template => $template_xml_string,</td></tr> |
192 | <tr><td class="h"><a name="22"></a>22</td><td></td><td></td><td></td><td></td><td class="s"> %opts ); # see below for available options</td></tr> |
193 | <tr><td class="h"><a name="23"></a>23</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
194 | <tr><td class="h"><a name="24"></a>24</td><td></td><td></td><td></td><td></td><td class="s"> use Text::TEI::Markup qw( word_tag_wrap );</td></tr> |
195 | <tr><td class="h"><a name="25"></a>25</td><td></td><td></td><td></td><td></td><td class="s"> my $word_wrapped_xml = word_tag_wrap( $tei_xml_string );</td></tr> |
196 | <tr><td class="h"><a name="26"></a>26</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
197 | <tr><td class="h"><a name="27"></a>27</td><td></td><td></td><td></td><td></td><td class="s">=head1 DESCRIPTION</td></tr> |
198 | <tr><td class="h"><a name="28"></a>28</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
199 | <tr><td class="h"><a name="29"></a>29</td><td></td><td></td><td></td><td></td><td class="s">TEI XML is a wonderful thing. The elements defined therein allow a</td></tr> |
200 | <tr><td class="h"><a name="30"></a>30</td><td></td><td></td><td></td><td></td><td class="s">transcriber to record and represent just about any feature of a text that</td></tr> |
201 | <tr><td class="h"><a name="31"></a>31</td><td></td><td></td><td></td><td></td><td class="s">he or she encounters.</td></tr> |
202 | <tr><td class="h"><a name="32"></a>32</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
203 | <tr><td class="h"><a name="33"></a>33</td><td></td><td></td><td></td><td></td><td class="s">The problem is the transcription itself. When I am transcribing a</td></tr> |
204 | <tr><td class="h"><a name="34"></a>34</td><td></td><td></td><td></td><td></td><td class="s">manuscript, especially if that manuscript is in a bunch of funny characters</td></tr> |
205 | <tr><td class="h"><a name="35"></a>35</td><td></td><td></td><td></td><td></td><td class="s">on the keymap for another language, I do not want to be switching back and</td></tr> |
206 | <tr><td class="h"><a name="36"></a>36</td><td></td><td></td><td></td><td></td><td class="s">forth between keyboard layouts in order to type "<tag attr="attr>"</td></tr> |
207 | <tr><td class="h"><a name="37"></a>37</td><td></td><td></td><td></td><td></td><td class="s">arrow-arrow-arrow-arrow-arrow "</tag> every six seconds. It's prone to</td></tr> |
208 | <tr><td class="h"><a name="38"></a>38</td><td></td><td></td><td></td><td></td><td class="s">typo, it's astonishingly slow, and it makes my wrists hurt just to think</td></tr> |
209 | <tr><td class="h"><a name="39"></a>39</td><td></td><td></td><td></td><td></td><td class="s">about it. I also don't really want to fire up an XML editor, select the</td></tr> |
210 | <tr><td class="h"><a name="40"></a>40</td><td></td><td></td><td></td><td></td><td class="s">words or characters that need to be tagged, and click a lot. That way is</td></tr> |
211 | <tr><td class="h"><a name="41"></a>41</td><td></td><td></td><td></td><td></td><td class="s">not prone to typo, but it's still pretty darn slow, and it makes my wrists</td></tr> |
212 | <tr><td class="h"><a name="42"></a>42</td><td></td><td></td><td></td><td></td><td class="s">hurt B<even more> to think about.</td></tr> |
213 | <tr><td class="h"><a name="43"></a>43</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
214 | <tr><td class="h"><a name="44"></a>44</td><td></td><td></td><td></td><td></td><td class="s">Text::TEI::Markup is my solution to that problem. It defines a bunch of</td></tr> |
215 | <tr><td class="h"><a name="45"></a>45</td><td></td><td></td><td></td><td></td><td class="s">single- or double-character sigils that represent tags. These are a lot</td></tr> |
216 | <tr><td class="h"><a name="46"></a>46</td><td></td><td></td><td></td><td></td><td class="s">faster and easier to type; I don't have to worry about typos; and I can do</td></tr> |
217 | <tr><td class="h"><a name="47"></a>47</td><td></td><td></td><td></td><td></td><td class="s">it all with a plain text editor, thus minimizing use of the mouse.</td></tr> |
218 | <tr><td class="h"><a name="48"></a>48</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
219 | <tr><td class="h"><a name="49"></a>49</td><td></td><td></td><td></td><td></td><td class="s">I have tried to pick sigils that don't conflict with characters that are</td></tr> |
220 | <tr><td class="h"><a name="50"></a>50</td><td></td><td></td><td></td><td></td><td class="s">found in manuscripts. I have succeeded for my particular set of</td></tr> |
221 | <tr><td class="h"><a name="51"></a>51</td><td></td><td></td><td></td><td></td><td class="s">manuscripts, but I have not succeeded for the general case. If you like the</td></tr> |
222 | <tr><td class="h"><a name="52"></a>52</td><td></td><td></td><td></td><td></td><td class="s">idea behind this module, you are still almost guaranteed to hate the sigils</td></tr> |
223 | <tr><td class="h"><a name="53"></a>53</td><td></td><td></td><td></td><td></td><td class="s">I've picked. That's okay; you can re-define them.</td></tr> |
224 | <tr><td class="h"><a name="54"></a>54</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
225 | <tr><td class="h"><a name="55"></a>55</td><td></td><td></td><td></td><td></td><td class="s">=head2 Extra bonus solution: word wrapping with <w/> and <seg/></td></tr> |
226 | <tr><td class="h"><a name="56"></a>56</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
227 | <tr><td class="h"><a name="57"></a>57</td><td></td><td></td><td></td><td></td><td class="s">Even if you are happy as a clam in the graphical XML editor of your choice,</td></tr> |
228 | <tr><td class="h"><a name="58"></a>58</td><td></td><td></td><td></td><td></td><td class="s">this module exports a function that may be useful to you. The TEI P5</td></tr> |
229 | <tr><td class="h"><a name="59"></a>59</td><td></td><td></td><td></td><td></td><td class="s">guidelines include a module called "analysis", which allows the user to tag</td></tr> |
230 | <tr><td class="h"><a name="60"></a>60</td><td></td><td></td><td></td><td></td><td class="s">sentences, clauses, words, morphemes, or any other sort of semantic segment</td></tr> |
231 | <tr><td class="h"><a name="61"></a>61</td><td></td><td></td><td></td><td></td><td class="s">of a text. This is really good for programmatic applications, but very</td></tr> |
232 | <tr><td class="h"><a name="62"></a>62</td><td></td><td></td><td></td><td></td><td class="s">boring and repetitive to have to tag.</td></tr> |
233 | <tr><td class="h"><a name="63"></a>63</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
234 | <tr><td class="h"><a name="64"></a>64</td><td></td><td></td><td></td><td></td><td class="s">The function B<word_tag_wrap> solves part of this problem for you. It takes</td></tr> |
235 | <tr><td class="h"><a name="65"></a>65</td><td></td><td></td><td></td><td></td><td class="s">an XML string as input, looks for words (defined by whitespace separation)</td></tr> |
236 | <tr><td class="h"><a name="66"></a>66</td><td></td><td></td><td></td><td></td><td class="s">and returns an XML string with each of these words wrapped in an</td></tr> |
237 | <tr><td class="h"><a name="67"></a>67</td><td></td><td></td><td></td><td></td><td class="s">appropriate tag. If the word has complex elements (e.g. editorial</td></tr> |
238 | <tr><td class="h"><a name="68"></a>68</td><td></td><td></td><td></td><td></td><td class="s">expansion), it will be wrapped in a <seg type="word/> tag. If not, it will</td></tr> |
239 | <tr><td class="h"><a name="69"></a>69</td><td></td><td></td><td></td><td></td><td class="s">be in a simple <w/> tag. It handles line breaks and page breaks within</td></tr> |
240 | <tr><td class="h"><a name="70"></a>70</td><td></td><td></td><td></td><td></td><td class="s">words, as long as there is no trailing whitespace before the <lb/> (or</td></tr> |
241 | <tr><td class="h"><a name="71"></a>71</td><td></td><td></td><td></td><td></td><td class="s"><pb/>) tag, and as long as the whitespace after the tag contains a carriage</td></tr> |
242 | <tr><td class="h"><a name="72"></a>72</td><td></td><td></td><td></td><td></td><td class="s">return.</td></tr> |
243 | <tr><td class="h"><a name="73"></a>73</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
244 | <tr><td class="h"><a name="74"></a>74</td><td></td><td></td><td></td><td></td><td class="s">=head1 MARKUP SYNTAX</td></tr> |
245 | <tr><td class="h"><a name="75"></a>75</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
246 | <tr><td class="h"><a name="76"></a>76</td><td></td><td></td><td></td><td></td><td class="s">The input file has a header and a body. The header begins with a '=HEAD'</td></tr> |
247 | <tr><td class="h"><a name="77"></a>77</td><td></td><td></td><td></td><td></td><td class="s">tag, and consists of a colon-separated list of key_value pairs. These keys,</td></tr> |
248 | <tr><td class="h"><a name="78"></a>78</td><td></td><td></td><td></td><td></td><td class="s">which are case insensitive, get directly substituted into an XML template;</td></tr> |
249 | <tr><td class="h"><a name="79"></a>79</td><td></td><td></td><td></td><td></td><td class="s">the idea is that your TEI header won't change very much between files, so</td></tr> |
250 | <tr><td class="h"><a name="80"></a>80</td><td></td><td></td><td></td><td></td><td class="s">you write it once with template values, pass it to &to_xml, and the</td></tr> |
251 | <tr><td class="h"><a name="81"></a>81</td><td></td><td></td><td></td><td></td><td class="s">substitution happens as if by magic. The keyword /MAIN/i is reserved for</td></tr> |
252 | <tr><td class="h"><a name="82"></a>82</td><td></td><td></td><td></td><td></td><td class="s">the content between the <body></body> tags - that is, all the content that</td></tr> |
253 | <tr><td class="h"><a name="83"></a>83</td><td></td><td></td><td></td><td></td><td class="s">will be generated after the '=BODY' tag.</td></tr> |
254 | <tr><td class="h"><a name="84"></a>84</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
255 | <tr><td class="h"><a name="85"></a>85</td><td></td><td></td><td></td><td></td><td class="s">A very simple template looks like this:</td></tr> |
256 | <tr><td class="h"><a name="86"></a>86</td><td></td><td></td><td></td><td></td><td class="s"> <?xml version="1.0" encoding="UTF-8"?></td></tr> |
257 | <tr><td class="h"><a name="87"></a>87</td><td></td><td></td><td></td><td></td><td class="s"> <TEI></td></tr> |
258 | <tr><td class="h"><a name="88"></a>88</td><td></td><td></td><td></td><td></td><td class="s"> <teiHeader></td></tr> |
259 | <tr><td class="h"><a name="89"></a>89</td><td></td><td></td><td></td><td></td><td class="s"> <fileDesc></td></tr> |
260 | <tr><td class="h"><a name="90"></a>90</td><td></td><td></td><td></td><td></td><td class="s"> <titleStmt></td></tr> |
261 | <tr><td class="h"><a name="91"></a>91</td><td></td><td></td><td></td><td></td><td class="s"> <title>__TITLE__</title></td></tr> |
262 | <tr><td class="h"><a name="92"></a>92</td><td></td><td></td><td></td><td></td><td class="s"> <author>__AUTHOR__</author></td></tr> |
263 | <tr><td class="h"><a name="93"></a>93</td><td></td><td></td><td></td><td></td><td class="s"> <respStmt xml:id="#__MYINITIALS__"></td></tr> |
264 | <tr><td class="h"><a name="94"></a>94</td><td></td><td></td><td></td><td></td><td class="s"> <resp>Transcription by</resp></td></tr> |
265 | <tr><td class="h"><a name="95"></a>95</td><td></td><td></td><td></td><td></td><td class="s"> <name>__MYNAME__</name></td></tr> |
266 | <tr><td class="h"><a name="96"></a>96</td><td></td><td></td><td></td><td></td><td class="s"> </respStmt></td></tr> |
267 | <tr><td class="h"><a name="97"></a>97</td><td></td><td></td><td></td><td></td><td class="s"> </titleStmt></td></tr> |
268 | <tr><td class="h"><a name="98"></a>98</td><td></td><td></td><td></td><td></td><td class="s"> </fileDesc></td></tr> |
269 | <tr><td class="h"><a name="99"></a>99</td><td></td><td></td><td></td><td></td><td class="s"> </teiHeader></td></tr> |
270 | <tr><td class="h"><a name="100"></a>100</td><td></td><td></td><td></td><td></td><td class="s"> <text></td></tr> |
271 | <tr><td class="h"><a name="101"></a>101</td><td></td><td></td><td></td><td></td><td class="s"> <body></td></tr> |
272 | <tr><td class="h"><a name="102"></a>102</td><td></td><td></td><td></td><td></td><td class="s"> __MAIN__</td></tr> |
273 | <tr><td class="h"><a name="103"></a>103</td><td></td><td></td><td></td><td></td><td class="s"> </body></td></tr> |
274 | <tr><td class="h"><a name="104"></a>104</td><td></td><td></td><td></td><td></td><td class="s"> </text></td></tr> |
275 | <tr><td class="h"><a name="105"></a>105</td><td></td><td></td><td></td><td></td><td class="s"> </TEI></td></tr> |
276 | <tr><td class="h"><a name="106"></a>106</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
277 | <tr><td class="h"><a name="107"></a>107</td><td></td><td></td><td></td><td></td><td class="s">Your input file should then begin something like this:</td></tr> |
278 | <tr><td class="h"><a name="108"></a>108</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
279 | <tr><td class="h"><a name="109"></a>109</td><td></td><td></td><td></td><td></td><td class="s"> =HEAD</td></tr> |
280 | <tr><td class="h"><a name="110"></a>110</td><td></td><td></td><td></td><td></td><td class="s"> title:My Summer Vacation: a novel</td></tr> |
281 | <tr><td class="h"><a name="111"></a>111</td><td></td><td></td><td></td><td></td><td class="s"> author:John Smith</td></tr> |
282 | <tr><td class="h"><a name="112"></a>112</td><td></td><td></td><td></td><td></td><td class="s"> myinitials:tla</td></tr> |
283 | <tr><td class="h"><a name="113"></a>113</td><td></td><td></td><td></td><td></td><td class="s"> myname:Tara L Andrews</td></tr> |
284 | <tr><td class="h"><a name="114"></a>114</td><td></td><td></td><td></td><td></td><td class="s"> =BODY</td></tr> |
285 | <tr><td class="h"><a name="115"></a>115</td><td></td><td></td><td></td><td></td><td class="s"> The ^real^ text b\e\gins +(above)t+here.</td></tr> |
286 | <tr><td class="h"><a name="116"></a>116</td><td></td><td></td><td></td><td></td><td class="s"> ...</td></tr> |
287 | <tr><td class="h"><a name="117"></a>117</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
288 | <tr><td class="h"><a name="118"></a>118</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
289 | <tr><td class="h"><a name="119"></a>119</td><td></td><td></td><td></td><td></td><td class="s">The real work begins after the '=BODY' tag. The currently-defined sigil</td></tr> |
290 | <tr><td class="h"><a name="120"></a>120</td><td></td><td></td><td></td><td></td><td class="s">list is:</td></tr> |
291 | <tr><td class="h"><a name="121"></a>121</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
292 | <tr><td class="h"><a name="122"></a>122</td><td></td><td></td><td></td><td></td><td class="s"> %SIGILS = ( </td></tr> |
293 | <tr><td class="h"><a name="123"></a>123</td><td></td><td></td><td></td><td></td><td class="s"> 'comment' => '##',</td></tr> |
294 | <tr><td class="h"><a name="124"></a>124</td><td></td><td></td><td></td><td></td><td class="s"> 'add' => '+',</td></tr> |
295 | <tr><td class="h"><a name="125"></a>125</td><td></td><td></td><td></td><td></td><td class="s"> 'del' => '-',</td></tr> |
296 | <tr><td class="h"><a name="126"></a>126</td><td></td><td></td><td></td><td></td><td class="s"> 'subst' => "\x{b1}", # Unicode PLUS-MINUS SIGN</td></tr> |
297 | <tr><td class="h"><a name="127"></a>127</td><td></td><td></td><td></td><td></td><td class="s"> 'div' => "\x{a7}", # Unicode SECTION SIGN</td></tr> |
298 | <tr><td class="h"><a name="128"></a>128</td><td></td><td></td><td></td><td></td><td class="s"> 'p' => "\x{b6}", # Unicode PILCROW SIGN</td></tr> |
299 | <tr><td class="h"><a name="129"></a>129</td><td></td><td></td><td></td><td></td><td class="s"> 'ex' => '\\',</td></tr> |
300 | <tr><td class="h"><a name="130"></a>130</td><td></td><td></td><td></td><td></td><td class="s"> 'expan' => '^',</td></tr> |
301 | <tr><td class="h"><a name="131"></a>131</td><td></td><td></td><td></td><td></td><td class="s"> 'supplied' => '@',</td></tr> |
302 | <tr><td class="h"><a name="132"></a>132</td><td></td><td></td><td></td><td></td><td class="s"> 'abbr' => [ '{', '}' ],</td></tr> |
303 | <tr><td class="h"><a name="133"></a>133</td><td></td><td></td><td></td><td></td><td class="s"> 'num' => '%',</td></tr> |
304 | <tr><td class="h"><a name="134"></a>134</td><td></td><td></td><td></td><td></td><td class="s"> 'pb' => [ '[', ']' ],</td></tr> |
305 | <tr><td class="h"><a name="135"></a>135</td><td></td><td></td><td></td><td></td><td class="s"> 'cb' => '|',</td></tr> |
306 | <tr><td class="h"><a name="136"></a>136</td><td></td><td></td><td></td><td></td><td class="s"> 'hi' => '*',</td></tr> |
307 | <tr><td class="h"><a name="137"></a>137</td><td></td><td></td><td></td><td></td><td class="s"> 'unclear' => '?',</td></tr> |
308 | <tr><td class="h"><a name="138"></a>138</td><td></td><td></td><td></td><td></td><td class="s"> 'q' => "\x{2020}", # Unicode DAGGER</td></tr> |
309 | <tr><td class="h"><a name="139"></a>139</td><td></td><td></td><td></td><td></td><td class="s"> );</td></tr> |
310 | <tr><td class="h"><a name="140"></a>140</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
311 | <tr><td class="h"><a name="141"></a>141</td><td></td><td></td><td></td><td></td><td class="s">Non-identical matched sets of sigla (e.g. '{}' for abbreviations) should be</td></tr> |
312 | <tr><td class="h"><a name="142"></a>142</td><td></td><td></td><td></td><td></td><td class="s">specified in a listref, as seen here.</td></tr> |
313 | <tr><td class="h"><a name="143"></a>143</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
314 | <tr><td class="h"><a name="144"></a>144</td><td></td><td></td><td></td><td></td><td class="s">The "add" and "del" sigils have an extra convenience feature - anything</td></tr> |
315 | <tr><td class="h"><a name="145"></a>145</td><td></td><td></td><td></td><td></td><td class="s">that appears in parentheses immediately after the add/del opening sigil ( +</td></tr> |
316 | <tr><td class="h"><a name="146"></a>146</td><td></td><td></td><td></td><td></td><td class="s">or - in the examples above) will get added as an attribute. If the string</td></tr> |
317 | <tr><td class="h"><a name="147"></a>147</td><td></td><td></td><td></td><td></td><td class="s">in parentheses has no '=' sign in it, the attribute for the "add" tag will</td></tr> |
318 | <tr><td class="h"><a name="148"></a>148</td><td></td><td></td><td></td><td></td><td class="s">be "place", and the attribute for the "del" tag will be "type". Ergo:</td></tr> |
319 | <tr><td class="h"><a name="149"></a>149</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
320 | <tr><td class="h"><a name="150"></a>150</td><td></td><td></td><td></td><td></td><td class="s"> +(margin)This is an addition+-(overwrite)and a deletion- to the sentence.</td></tr> |
321 | <tr><td class="h"><a name="151"></a>151</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
322 | <tr><td class="h"><a name="152"></a>152</td><td></td><td></td><td></td><td></td><td class="s">will get translated to</td></tr> |
323 | <tr><td class="h"><a name="153"></a>153</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
324 | <tr><td class="h"><a name="154"></a>154</td><td></td><td></td><td></td><td></td><td class="s"> <add place="margin">This is an addition</add> </td></tr> |
325 | <tr><td class="h"><a name="155"></a>155</td><td></td><td></td><td></td><td></td><td class="s"> <del type="overwrite">and a deletion</del> to the sentence.</td></tr> |
326 | <tr><td class="h"><a name="156"></a>156</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
327 | <tr><td class="h"><a name="157"></a>157</td><td></td><td></td><td></td><td></td><td class="s">This behavior ought to be more configurable and/or flexible; make it worth</td></tr> |
328 | <tr><td class="h"><a name="158"></a>158</td><td></td><td></td><td></td><td></td><td class="s">my while.</td></tr> |
329 | <tr><td class="h"><a name="159"></a>159</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
330 | <tr><td class="h"><a name="160"></a>160</td><td></td><td></td><td></td><td></td><td class="s">Whitespace is only significant at the end of lines. If a line which</td></tr> |
331 | <tr><td class="h"><a name="161"></a>161</td><td></td><td></td><td></td><td></td><td class="s">contains non-tag text (i.e. words) ends in whitespace, it is assumed that</td></tr> |
332 | <tr><td class="h"><a name="162"></a>162</td><td></td><td></td><td></td><td></td><td class="s">the previous word is a complete word. If the line ends with a</td></tr> |
333 | <tr><td class="h"><a name="163"></a>163</td><td></td><td></td><td></td><td></td><td class="s">non-whitespace character, it is assumed that the word continues onto the</td></tr> |
334 | <tr><td class="h"><a name="164"></a>164</td><td></td><td></td><td></td><td></td><td class="s">next line.</td></tr> |
335 | <tr><td class="h"><a name="165"></a>165</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
336 | <tr><td class="h"><a name="166"></a>166</td><td></td><td></td><td></td><td></td><td class="s">All the sigils must be balanced, and they must nest properly. Remember that</td></tr> |
337 | <tr><td class="h"><a name="167"></a>167</td><td></td><td></td><td></td><td></td><td class="s">this is a shorthand for XML. I could be convinced to try to autocorrect</td></tr> |
338 | <tr><td class="h"><a name="168"></a>168</td><td></td><td></td><td></td><td></td><td class="s">some unbalanced sigils, but it would be worth at least a few pints of cider</td></tr> |
339 | <tr><td class="h"><a name="169"></a>169</td><td></td><td></td><td></td><td></td><td class="s">(or, of course, a patch.)</td></tr> |
340 | <tr><td class="h"><a name="170"></a>170</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
341 | <tr><td class="h"><a name="171"></a>171</td><td></td><td></td><td></td><td></td><td class="s">=head1 SUBROUTINES</td></tr> |
342 | <tr><td class="h"><a name="172"></a>172</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
343 | <tr><td class="h"><a name="173"></a>173</td><td></td><td></td><td></td><td></td><td class="s">=over 4</td></tr> |
344 | <tr><td class="h"><a name="174"></a>174</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
345 | <tr><td class="h"><a name="175"></a>175</td><td></td><td></td><td></td><td></td><td class="s">=item B<to_xml>( file => '$filename', %opts );</td></tr> |
346 | <tr><td class="h"><a name="176"></a>176</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
347 | <tr><td class="h"><a name="177"></a>177</td><td></td><td></td><td></td><td></td><td class="s">Takes the name of a file that holds a marked-up version of text. Returns a</td></tr> |
348 | <tr><td class="h"><a name="178"></a>178</td><td></td><td></td><td></td><td></td><td class="s">TEI XML string to represent that text. Options include:</td></tr> |
349 | <tr><td class="h"><a name="179"></a>179</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
350 | <tr><td class="h"><a name="180"></a>180</td><td></td><td></td><td></td><td></td><td class="s">=over 4</td></tr> |
351 | <tr><td class="h"><a name="181"></a>181</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
352 | <tr><td class="h"><a name="182"></a>182</td><td></td><td></td><td></td><td></td><td class="s">=item C<template></td></tr> |
353 | <tr><td class="h"><a name="183"></a>183</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
354 | <tr><td class="h"><a name="184"></a>184</td><td></td><td></td><td></td><td></td><td class="s">a string containing the XML template that you want to use for the markup.</td></tr> |
355 | <tr><td class="h"><a name="185"></a>185</td><td></td><td></td><td></td><td></td><td class="s">If none is specified, there is a default. That default is useful for me,</td></tr> |
356 | <tr><td class="h"><a name="186"></a>186</td><td></td><td></td><td></td><td></td><td class="s">but is very unlikely to be useful for you. =item C<fileopen_mode></td></tr> |
357 | <tr><td class="h"><a name="187"></a>187</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
358 | <tr><td class="h"><a name="188"></a>188</td><td></td><td></td><td></td><td></td><td class="s">a mode string to pass to the open() call on the file. Default "<:utf8".</td></tr> |
359 | <tr><td class="h"><a name="189"></a>189</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
360 | <tr><td class="h"><a name="190"></a>190</td><td></td><td></td><td></td><td></td><td class="s">=item C<number_conversion></td></tr> |
361 | <tr><td class="h"><a name="191"></a>191</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
362 | <tr><td class="h"><a name="192"></a>192</td><td></td><td></td><td></td><td></td><td class="s">a subroutine ref that will calculate the value of number representations.</td></tr> |
363 | <tr><td class="h"><a name="193"></a>193</td><td></td><td></td><td></td><td></td><td class="s">Useful for, e.g., Latin numerals. This is optional - if nothing is passed,</td></tr> |
364 | <tr><td class="h"><a name="194"></a>194</td><td></td><td></td><td></td><td></td><td class="s">no number value calculation will be attempted. =item C<sigils></td></tr> |
365 | <tr><td class="h"><a name="195"></a>195</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
366 | <tr><td class="h"><a name="196"></a>196</td><td></td><td></td><td></td><td></td><td class="s">a hashref containing the preferred sigil representations of TEI tags.</td></tr> |
367 | <tr><td class="h"><a name="197"></a>197</td><td></td><td></td><td></td><td></td><td class="s">Defaults to the list above. =item C<wrap_words></td></tr> |
368 | <tr><td class="h"><a name="198"></a>198</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
369 | <tr><td class="h"><a name="199"></a>199</td><td></td><td></td><td></td><td></td><td class="s">Defaults to "true". If you pass a false value, the word wrapping will be</td></tr> |
370 | <tr><td class="h"><a name="200"></a>200</td><td></td><td></td><td></td><td></td><td class="s">skipped. </td></tr> |
371 | <tr><td class="h"><a name="201"></a>201</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
372 | <tr><td class="h"><a name="202"></a>202</td><td></td><td></td><td></td><td></td><td class="s">=item C<format></td></tr> |
373 | <tr><td class="h"><a name="203"></a>203</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
374 | <tr><td class="h"><a name="204"></a>204</td><td></td><td></td><td></td><td></td><td class="s">Defaults to 0. Controls whether rudimentary formatting is applied to the</td></tr> |
375 | <tr><td class="h"><a name="205"></a>205</td><td></td><td></td><td></td><td></td><td class="s">XML returned. Possible values are 0, 1, and "more than 1". See</td></tr> |
376 | <tr><td class="h"><a name="206"></a>206</td><td></td><td></td><td></td><td></td><td class="s">XML::LibXML::Document::serialize for more information. (Personally I just</td></tr> |
377 | <tr><td class="h"><a name="207"></a>207</td><td></td><td></td><td></td><td></td><td class="s">xmllint it separately.)</td></tr> |
378 | <tr><td class="h"><a name="208"></a>208</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
379 | <tr><td class="h"><a name="209"></a>209</td><td></td><td></td><td></td><td></td><td class="s">=back</td></tr> |
380 | <tr><td class="h"><a name="210"></a>210</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
381 | <tr><td class="h"><a name="211"></a>211</td><td></td><td></td><td></td><td></td><td class="s">The return string is run through the basic formatting mechanism provided by</td></tr> |
382 | <tr><td class="h"><a name="212"></a>212</td><td></td><td></td><td></td><td></td><td class="s">XML::LibXML. You may wish to pass it through a pretty printer more to your</td></tr> |
383 | <tr><td class="h"><a name="213"></a>213</td><td></td><td></td><td></td><td></td><td class="s">taste. </td></tr> |
384 | <tr><td class="h"><a name="214"></a>214</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
385 | <tr><td class="h"><a name="215"></a>215</td><td></td><td></td><td></td><td></td><td class="s">=cut</td></tr> |
386 | <tr><td class="h"><a name="216"></a>216</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
387 | <tr><td class="h"><a name="217"></a>217</td><td></td><td></td><td></td><td></td><td class="s"># Default list of funky signs I use.</td></tr> |
388 | <tr><td class="h"><a name="218"></a>218</td><td></td><td></td><td></td><td></td><td class="s"># TODO: Add header support</td></tr> |
389 | <tr><td class="h"><a name="219"></a>219</td><td class="c3">1</td><td class="c3"><span title="Avg 25µs">25µs</span></td><td></td><td></td><td class="s">my %SIGILS = ( </td></tr> |
390 | <tr><td class="h"><a name="220"></a>220</td><td></td><td></td><td></td><td></td><td class="s"> 'comment' => '##',</td></tr> |
391 | <tr><td class="h"><a name="221"></a>221</td><td></td><td></td><td></td><td></td><td class="s"> 'add' => '+',</td></tr> |
392 | <tr><td class="h"><a name="222"></a>222</td><td></td><td></td><td></td><td></td><td class="s"> 'del' => '-',</td></tr> |
393 | <tr><td class="h"><a name="223"></a>223</td><td></td><td></td><td></td><td></td><td class="s"> 'subst' => "\x{b1}",</td></tr> |
394 | <tr><td class="h"><a name="224"></a>224</td><td></td><td></td><td></td><td></td><td class="s"> 'div' => "\x{a7}",</td></tr> |
395 | <tr><td class="h"><a name="225"></a>225</td><td></td><td></td><td></td><td></td><td class="s"> 'p' => "\x{b6}",</td></tr> |
396 | <tr><td class="h"><a name="226"></a>226</td><td></td><td></td><td></td><td></td><td class="s"> 'ex' => '\\',</td></tr> |
397 | <tr><td class="h"><a name="227"></a>227</td><td></td><td></td><td></td><td></td><td class="s"> 'expan' => '^',</td></tr> |
398 | <tr><td class="h"><a name="228"></a>228</td><td></td><td></td><td></td><td></td><td class="s"> 'supplied' => '@',</td></tr> |
399 | <tr><td class="h"><a name="229"></a>229</td><td></td><td></td><td></td><td></td><td class="s"> 'abbr' => [ '{', '}' ],</td></tr> |
400 | <tr><td class="h"><a name="230"></a>230</td><td></td><td></td><td></td><td></td><td class="s"> 'num' => '%',</td></tr> |
401 | <tr><td class="h"><a name="231"></a>231</td><td></td><td></td><td></td><td></td><td class="s"> 'pb' => [ '[', ']' ],</td></tr> |
402 | <tr><td class="h"><a name="232"></a>232</td><td></td><td></td><td></td><td></td><td class="s"> 'cb' => '|',</td></tr> |
403 | <tr><td class="h"><a name="233"></a>233</td><td></td><td></td><td></td><td></td><td class="s"> 'hi' => '*',</td></tr> |
404 | <tr><td class="h"><a name="234"></a>234</td><td></td><td></td><td></td><td></td><td class="s"> 'unclear' => '?',</td></tr> |
405 | <tr><td class="h"><a name="235"></a>235</td><td></td><td></td><td></td><td></td><td class="s"> 'q' => "\x{2020}",</td></tr> |
406 | <tr><td class="h"><a name="236"></a>236</td><td></td><td></td><td></td><td></td><td class="s"> );</td></tr> |
407 | <tr><td class="h"><a name="237"></a>237</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
408 | <tr><td class="h"><a name="238"></a>238</td><td></td><td></td><td></td><td></td><td class="s">sub to_xml {</td></tr> |
409 | <tr><td class="h"><a name="239"></a>239</td><td></td><td></td><td></td><td></td><td class="s"> my %opts = (</td></tr> |
410 | <tr><td class="h"><a name="240"></a>240</td><td></td><td></td><td></td><td></td><td class="s"> 'number_conversion' => undef,</td></tr> |
411 | <tr><td class="h"><a name="241"></a>241</td><td></td><td></td><td></td><td></td><td class="s"> 'fileopen_mode' => '<:utf8',</td></tr> |
412 | <tr><td class="h"><a name="242"></a>242</td><td></td><td></td><td></td><td></td><td class="s"> 'wrap_words' => 1,</td></tr> |
413 | <tr><td class="h"><a name="243"></a>243</td><td></td><td></td><td></td><td></td><td class="s"> 'sigils' => \%SIGILS,</td></tr> |
414 | <tr><td class="h"><a name="244"></a>244</td><td></td><td></td><td></td><td></td><td class="s"> 'template' => undef,</td></tr> |
415 | <tr><td class="h"><a name="245"></a>245</td><td></td><td></td><td></td><td></td><td class="s"> 'format' => 0,</td></tr> |
416 | <tr><td class="h"><a name="246"></a>246</td><td></td><td></td><td></td><td></td><td class="s"> @_,</td></tr> |
417 | <tr><td class="h"><a name="247"></a>247</td><td></td><td></td><td></td><td></td><td class="s"> );</td></tr> |
418 | <tr><td class="h"><a name="248"></a>248</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
419 | <tr><td class="h"><a name="249"></a>249</td><td></td><td></td><td></td><td></td><td class="s"> unless( defined( $opts{'file'} ) ) {</td></tr> |
420 | <tr><td class="h"><a name="250"></a>250</td><td></td><td></td><td></td><td></td><td class="s"> warn "No file specified! Doing nothing.";</td></tr> |
421 | <tr><td class="h"><a name="251"></a>251</td><td></td><td></td><td></td><td></td><td class="s"> return undef;</td></tr> |
422 | <tr><td class="h"><a name="252"></a>252</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
423 | <tr><td class="h"><a name="253"></a>253</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
424 | <tr><td class="h"><a name="254"></a>254</td><td></td><td></td><td></td><td></td><td class="s"> if( ref( $opts{'number_conversion'} ) ne 'CODE' ) {</td></tr> |
425 | <tr><td class="h"><a name="255"></a>255</td><td></td><td></td><td></td><td></td><td class="s"> warn "number_conversion argument must be a subroutine ref";</td></tr> |
426 | <tr><td class="h"><a name="256"></a>256</td><td></td><td></td><td></td><td></td><td class="s"> $opts{'number_conversion'} = undef;</td></tr> |
427 | <tr><td class="h"><a name="257"></a>257</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
428 | <tr><td class="h"><a name="258"></a>258</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
429 | <tr><td class="h"><a name="259"></a>259</td><td></td><td></td><td></td><td></td><td class="s"> my $inbody;</td></tr> |
430 | <tr><td class="h"><a name="260"></a>260</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
431 | <tr><td class="h"><a name="261"></a>261</td><td></td><td></td><td></td><td></td><td class="s"> my $rc = open( FILE, $opts{'fileopen_mode'}, $opts{'file'} );</td></tr> |
432 | <tr><td class="h"><a name="262"></a>262</td><td></td><td></td><td></td><td></td><td class="s"> unless( $rc ) {</td></tr> |
433 | <tr><td class="h"><a name="263"></a>263</td><td></td><td></td><td></td><td></td><td class="s"> warn "Could not open $opts{'file'}: $@";</td></tr> |
434 | <tr><td class="h"><a name="264"></a>264</td><td></td><td></td><td></td><td></td><td class="s"> return undef;</td></tr> |
435 | <tr><td class="h"><a name="265"></a>265</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
436 | <tr><td class="h"><a name="266"></a>266</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
437 | <tr><td class="h"><a name="267"></a>267</td><td></td><td></td><td></td><td></td><td class="s"> my $tmpl;</td></tr> |
438 | <tr><td class="h"><a name="268"></a>268</td><td></td><td></td><td></td><td></td><td class="s"> if( defined $opts{'template'} ) {</td></tr> |
439 | <tr><td class="h"><a name="269"></a>269</td><td></td><td></td><td></td><td></td><td class="s"> $tmpl = $opts{'template'};</td></tr> |
440 | <tr><td class="h"><a name="270"></a>270</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
441 | <tr><td class="h"><a name="271"></a>271</td><td></td><td></td><td></td><td></td><td class="s"> my @tmpl_lines = <DATA>;</td></tr> |
442 | <tr><td class="h"><a name="272"></a>272</td><td></td><td></td><td></td><td></td><td class="s"> $tmpl = join( '', @tmpl_lines );</td></tr> |
443 | <tr><td class="h"><a name="273"></a>273</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
444 | <tr><td class="h"><a name="274"></a>274</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
445 | <tr><td class="h"><a name="275"></a>275</td><td></td><td></td><td></td><td></td><td class="s"> my $main_xml;</td></tr> |
446 | <tr><td class="h"><a name="276"></a>276</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
447 | <tr><td class="h"><a name="277"></a>277</td><td></td><td></td><td></td><td></td><td class="s"> my( $in_p, $in_div ) = ( undef, undef );</td></tr> |
448 | <tr><td class="h"><a name="278"></a>278</td><td></td><td></td><td></td><td></td><td class="s"> while(<FILE>) {</td></tr> |
449 | <tr><td class="h"><a name="279"></a>279</td><td></td><td></td><td></td><td></td><td class="s"> chomp;</td></tr> |
450 | <tr><td class="h"><a name="280"></a>280</td><td></td><td></td><td></td><td></td><td class="s"> next if /^\s*$/;</td></tr> |
451 | <tr><td class="h"><a name="281"></a>281</td><td></td><td></td><td></td><td></td><td class="s"> s/^\s*//;</td></tr> |
452 | <tr><td class="h"><a name="282"></a>282</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
453 | <tr><td class="h"><a name="283"></a>283</td><td></td><td></td><td></td><td></td><td class="s"> if( /^=BODY/ ) {</td></tr> |
454 | <tr><td class="h"><a name="284"></a>284</td><td></td><td></td><td></td><td></td><td class="s"> $inbody = 1;</td></tr> |
455 | <tr><td class="h"><a name="285"></a>285</td><td></td><td></td><td></td><td></td><td class="s"> # Have we found a responsible person?</td></tr> |
456 | <tr><td class="h"><a name="286"></a>286</td><td></td><td></td><td></td><td></td><td class="s"> unless( exists $opts{'resp'} ) {</td></tr> |
457 | <tr><td class="h"><a name="287"></a>287</td><td></td><td></td><td></td><td></td><td class="s"> warn "No responsible person specified for edits!";</td></tr> |
458 | <tr><td class="h"><a name="288"></a>288</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
459 | <tr><td class="h"><a name="289"></a>289</td><td></td><td></td><td></td><td></td><td class="s"> next;</td></tr> |
460 | <tr><td class="h"><a name="290"></a>290</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
461 | <tr><td class="h"><a name="291"></a>291</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
462 | <tr><td class="h"><a name="292"></a>292</td><td></td><td></td><td></td><td></td><td class="s"> if( /^(\w+):(.*)$/ ) {</td></tr> |
463 | <tr><td class="h"><a name="293"></a>293</td><td></td><td></td><td></td><td></td><td class="s"> # Make the header template substitution.</td></tr> |
464 | <tr><td class="h"><a name="294"></a>294</td><td></td><td></td><td></td><td></td><td class="s"> warn "Warning: header line $_ in body section" if $inbody;</td></tr> |
465 | <tr><td class="h"><a name="295"></a>295</td><td></td><td></td><td></td><td></td><td class="s"> my( $key, $val ) = ( lc( $1 ), $2 );</td></tr> |
466 | <tr><td class="h"><a name="296"></a>296</td><td></td><td></td><td></td><td></td><td class="s"> if( $key eq 'main' ) {</td></tr> |
467 | <tr><td class="h"><a name="297"></a>297</td><td></td><td></td><td></td><td></td><td class="s"> warn "Illegal key $key; not substituting";</td></tr> |
468 | <tr><td class="h"><a name="298"></a>298</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
469 | <tr><td class="h"><a name="299"></a>299</td><td></td><td></td><td></td><td></td><td class="s"> $tmpl =~ s/__${key}__/$val/gi;</td></tr> |
470 | <tr><td class="h"><a name="300"></a>300</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
471 | <tr><td class="h"><a name="301"></a>301</td><td></td><td></td><td></td><td></td><td class="s"> if( $key eq 'transcriberid' ) {</td></tr> |
472 | <tr><td class="h"><a name="302"></a>302</td><td></td><td></td><td></td><td></td><td class="s"> $opts{'resp'} = '#' . $val;</td></tr> |
473 | <tr><td class="h"><a name="303"></a>303</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
474 | <tr><td class="h"><a name="304"></a>304</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
475 | <tr><td class="h"><a name="305"></a>305</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
476 | <tr><td class="h"><a name="306"></a>306</td><td></td><td></td><td></td><td></td><td class="s"> if( $inbody ) {</td></tr> |
477 | <tr><td class="h"><a name="307"></a>307</td><td></td><td></td><td></td><td></td><td class="s"> # Send it to the parser.</td></tr> |
478 | <tr><td class="h"><a name="308"></a>308</td><td></td><td></td><td></td><td></td><td class="s"> my $line;</td></tr> |
479 | <tr><td class="h"><a name="309"></a>309</td><td></td><td></td><td></td><td></td><td class="s"> ## TODO: Upgrade to perl 5.10 to get state variables.</td></tr> |
480 | <tr><td class="h"><a name="310"></a>310</td><td></td><td></td><td></td><td></td><td class="s"> ( $line, $in_div, $in_p ) = _process_line( $_, $in_div, $in_p, %opts );</td></tr> |
481 | <tr><td class="h"><a name="311"></a>311</td><td></td><td></td><td></td><td></td><td class="s"> $main_xml .= $line;</td></tr> |
482 | <tr><td class="h"><a name="312"></a>312</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
483 | <tr><td class="h"><a name="313"></a>313</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
484 | <tr><td class="h"><a name="314"></a>314</td><td></td><td></td><td></td><td></td><td class="s"> close FILE;</td></tr> |
485 | <tr><td class="h"><a name="315"></a>315</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
486 | <tr><td class="h"><a name="316"></a>316</td><td></td><td></td><td></td><td></td><td class="s"> $tmpl =~ s/__MAIN__/$main_xml/;</td></tr> |
487 | <tr><td class="h"><a name="317"></a>317</td><td></td><td></td><td></td><td></td><td class="s"> if( $opts{'wrap_words'} ) {</td></tr> |
488 | <tr><td class="h"><a name="318"></a>318</td><td></td><td></td><td></td><td></td><td class="s"> $tmpl = word_tag_wrap( $tmpl, $opts{'format'} );</td></tr> |
489 | <tr><td class="h"><a name="319"></a>319</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
490 | <tr><td class="h"><a name="320"></a>320</td><td></td><td></td><td></td><td></td><td class="s"> # Just make sure it parses, and format it if asked.</td></tr> |
491 | <tr><td class="h"><a name="321"></a>321</td><td></td><td></td><td></td><td></td><td class="s"> my $parser = XML::LibXML->new();</td></tr> |
492 | <tr><td class="h"><a name="322"></a>322</td><td></td><td></td><td></td><td></td><td class="s"> my $doc;</td></tr> |
493 | <tr><td class="h"><a name="323"></a>323</td><td></td><td></td><td></td><td></td><td class="s"> my $ok = eval{ $doc = $parser->parse_string( $tmpl ); };</td></tr> |
494 | <tr><td class="h"><a name="324"></a>324</td><td></td><td></td><td></td><td></td><td class="s"> unless( $ok ) {</td></tr> |
495 | <tr><td class="h"><a name="325"></a>325</td><td></td><td></td><td></td><td></td><td class="s"> warn "Parsing of new XML doc failed: $@";</td></tr> |
496 | <tr><td class="h"><a name="326"></a>326</td><td></td><td></td><td></td><td></td><td class="s"> return undef;</td></tr> |
497 | <tr><td class="h"><a name="327"></a>327</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
498 | <tr><td class="h"><a name="328"></a>328</td><td></td><td></td><td></td><td></td><td class="s"> $tmpl = decode( $doc->encoding, $doc->serialize( $opts{'format'} ) );</td></tr> |
499 | <tr><td class="h"><a name="329"></a>329</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
500 | <tr><td class="h"><a name="330"></a>330</td><td></td><td></td><td></td><td></td><td class="s"> return $tmpl;</td></tr> |
501 | <tr><td class="h"><a name="331"></a>331</td><td></td><td></td><td></td><td></td><td class="s">}</td></tr> |
502 | <tr><td class="h"><a name="332"></a>332</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
503 | <tr><td class="h"><a name="333"></a>333</td><td></td><td></td><td></td><td></td><td class="s">sub _process_line {</td></tr> |
504 | <tr><td class="h"><a name="334"></a>334</td><td></td><td></td><td></td><td></td><td class="s"> my( $line, $in_div, $in_p, %opts ) = @_;</td></tr> |
505 | <tr><td class="h"><a name="335"></a>335</td><td></td><td></td><td></td><td></td><td class="s"> chomp $line;</td></tr> |
506 | <tr><td class="h"><a name="336"></a>336</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
507 | <tr><td class="h"><a name="337"></a>337</td><td></td><td></td><td></td><td></td><td class="s"> # Look for paragraph and div markers. </td></tr> |
508 | <tr><td class="h"><a name="338"></a>338</td><td></td><td></td><td></td><td></td><td class="s"> my $sigils = $opts{'sigils'};</td></tr> |
509 | <tr><td class="h"><a name="339"></a>339</td><td></td><td></td><td></td><td></td><td class="s"> my( $divsig, $pgsig ) = ( $sigils->{'div'}, $sigils->{'p'} );</td></tr> |
510 | <tr><td class="h"><a name="340"></a>340</td><td></td><td></td><td></td><td></td><td class="s"> while( $line =~ /\Q$divsig\E(\d*)/g ) { </td></tr> |
511 | <tr><td class="h"><a name="341"></a>341</td><td></td><td></td><td></td><td></td><td class="s"> my $divno = $1;</td></tr> |
512 | <tr><td class="h"><a name="342"></a>342</td><td></td><td></td><td></td><td></td><td class="s"> # Calculate the starting position.</td></tr> |
513 | <tr><td class="h"><a name="343"></a>343</td><td></td><td></td><td></td><td></td><td class="s"> my $pos = pos( $line ) - 1;</td></tr> |
514 | <tr><td class="h"><a name="344"></a>344</td><td></td><td></td><td></td><td></td><td class="s"> $pos -= length( $divno ) if $divno;</td></tr> |
515 | <tr><td class="h"><a name="345"></a>345</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
516 | <tr><td class="h"><a name="346"></a>346</td><td></td><td></td><td></td><td></td><td class="s"> if( $in_div ) {</td></tr> |
517 | <tr><td class="h"><a name="347"></a>347</td><td></td><td></td><td></td><td></td><td class="s"> warn "Nonsensical division number at end-division tag"</td></tr> |
518 | <tr><td class="h"><a name="348"></a>348</td><td></td><td></td><td></td><td></td><td class="s"> if $divno;</td></tr> |
519 | <tr><td class="h"><a name="349"></a>349</td><td></td><td></td><td></td><td></td><td class="s"> substr( $line, $pos, 1, '</div>' );</td></tr> |
520 | <tr><td class="h"><a name="350"></a>350</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
521 | <tr><td class="h"><a name="351"></a>351</td><td></td><td></td><td></td><td></td><td class="s"> my $divstr = '<div' . ( $divno ? " n=\"$divno\"" : '' ) . ">";</td></tr> |
522 | <tr><td class="h"><a name="352"></a>352</td><td></td><td></td><td></td><td></td><td class="s"> substr( $line, $pos, pos( $line ) - $pos, $divstr );</td></tr> |
523 | <tr><td class="h"><a name="353"></a>353</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
524 | <tr><td class="h"><a name="354"></a>354</td><td></td><td></td><td></td><td></td><td class="s"> $in_div = !$in_div;</td></tr> |
525 | <tr><td class="h"><a name="355"></a>355</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
526 | <tr><td class="h"><a name="356"></a>356</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
527 | <tr><td class="h"><a name="357"></a>357</td><td></td><td></td><td></td><td></td><td class="s"> while( $line =~ /\Q$pgsig\E/g ) {</td></tr> |
528 | <tr><td class="h"><a name="358"></a>358</td><td></td><td></td><td></td><td></td><td class="s"> my $p_str = '<' . ( $in_p ? '/' : '' ) . 'p>';</td></tr> |
529 | <tr><td class="h"><a name="359"></a>359</td><td></td><td></td><td></td><td></td><td class="s"> substr( $line, pos( $line ) - 1, 1, $p_str );</td></tr> |
530 | <tr><td class="h"><a name="360"></a>360</td><td></td><td></td><td></td><td></td><td class="s"> $in_p = !$in_p;</td></tr> |
531 | <tr><td class="h"><a name="361"></a>361</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
532 | <tr><td class="h"><a name="362"></a>362</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
533 | <tr><td class="h"><a name="363"></a>363</td><td></td><td></td><td></td><td></td><td class="s"> # Add and delete tags. Do this first so that we do not stomp later</td></tr> |
534 | <tr><td class="h"><a name="364"></a>364</td><td></td><td></td><td></td><td></td><td class="s"> # instances of the dash (e.g. in XML comments).</td></tr> |
535 | <tr><td class="h"><a name="365"></a>365</td><td></td><td></td><td></td><td></td><td class="s"> while( $line =~ m|([-+])(\(([^\)]+)\))?(.*?)\1|g ) {</td></tr> |
536 | <tr><td class="h"><a name="366"></a>366</td><td></td><td></td><td></td><td></td><td class="s"> my( $op, $attr, $word ) = ( $1, $3, $4 );</td></tr> |
537 | <tr><td class="h"><a name="367"></a>367</td><td></td><td></td><td></td><td></td><td class="s"> # Calculate starting position.</td></tr> |
538 | <tr><td class="h"><a name="368"></a>368</td><td></td><td></td><td></td><td></td><td class="s"> my $pos = pos( $line ) - ( length( $word ) + 2 );</td></tr> |
539 | <tr><td class="h"><a name="369"></a>369</td><td></td><td></td><td></td><td></td><td class="s"> $pos -= ( length( $attr ) + 2 ) if $attr;</td></tr> |
540 | <tr><td class="h"><a name="370"></a>370</td><td></td><td></td><td></td><td></td><td class="s"> # Figure out what the attribute string, if any, should be.</td></tr> |
541 | <tr><td class="h"><a name="371"></a>371</td><td></td><td></td><td></td><td></td><td class="s"> my $attr_str;</td></tr> |
542 | <tr><td class="h"><a name="372"></a>372</td><td></td><td></td><td></td><td></td><td class="s"> if( $attr && $attr =~ /\=/ ) {</td></tr> |
543 | <tr><td class="h"><a name="373"></a>373</td><td></td><td></td><td></td><td></td><td class="s"> $attr_str = $attr;</td></tr> |
544 | <tr><td class="h"><a name="374"></a>374</td><td></td><td></td><td></td><td></td><td class="s"> } elsif ( $attr ) {</td></tr> |
545 | <tr><td class="h"><a name="375"></a>375</td><td></td><td></td><td></td><td></td><td class="s"> $attr_str = ( $op eq '+' ? "place" : "type" ) </td></tr> |
546 | <tr><td class="h"><a name="376"></a>376</td><td></td><td></td><td></td><td></td><td class="s"> . "=\"$attr\"";</td></tr> |
547 | <tr><td class="h"><a name="377"></a>377</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
548 | <tr><td class="h"><a name="378"></a>378</td><td></td><td></td><td></td><td></td><td class="s"> my $interp_str = '<' . ( $op eq '+' ? 'add' : 'del' )</td></tr> |
549 | <tr><td class="h"><a name="379"></a>379</td><td></td><td></td><td></td><td></td><td class="s"> . ( $attr_str ? " $attr_str" : '' )</td></tr> |
550 | <tr><td class="h"><a name="380"></a>380</td><td></td><td></td><td></td><td></td><td class="s"> . ">$word</" . ( $op eq '+' ? 'add' : 'del' ) . '>';</td></tr> |
551 | <tr><td class="h"><a name="381"></a>381</td><td></td><td></td><td></td><td></td><td class="s"> substr( $line, $pos, pos( $line ) - $pos, $interp_str );</td></tr> |
552 | <tr><td class="h"><a name="382"></a>382</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
553 | <tr><td class="h"><a name="383"></a>383</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
554 | <tr><td class="h"><a name="384"></a>384</td><td></td><td></td><td></td><td></td><td class="s"> # All the tags that are not very special cases.</td></tr> |
555 | <tr><td class="h"><a name="385"></a>385</td><td></td><td></td><td></td><td></td><td class="s"> foreach my $tag ( qw( subst abbr hi ex expan num unclear q supplied ) ) {</td></tr> |
556 | <tr><td class="h"><a name="386"></a>386</td><td></td><td></td><td></td><td></td><td class="s"> my $tag_sig = $sigils->{$tag};</td></tr> |
557 | <tr><td class="h"><a name="387"></a>387</td><td></td><td></td><td></td><td></td><td class="s"> my( $tag_open, $tag_close );</td></tr> |
558 | <tr><td class="h"><a name="388"></a>388</td><td></td><td></td><td></td><td></td><td class="s"> if( ref( $tag_sig ) eq 'ARRAY' ) {</td></tr> |
559 | <tr><td class="h"><a name="389"></a>389</td><td></td><td></td><td></td><td></td><td class="s"> ( $tag_open, $tag_close ) = @$tag_sig;</td></tr> |
560 | <tr><td class="h"><a name="390"></a>390</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
561 | <tr><td class="h"><a name="391"></a>391</td><td></td><td></td><td></td><td></td><td class="s"> $tag_open = $tag_close = $tag_sig;</td></tr> |
562 | <tr><td class="h"><a name="392"></a>392</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
563 | <tr><td class="h"><a name="393"></a>393</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
564 | <tr><td class="h"><a name="394"></a>394</td><td></td><td></td><td></td><td></td><td class="s"> $line =~ s|\Q$tag_open\E(.*?)\Q$tag_close\E|_open_tag( $tag, $1, \%opts ) . "</$tag>"|ge;</td></tr> |
565 | <tr><td class="h"><a name="395"></a>395</td><td></td><td></td><td></td><td></td><td class="s"> } </td></tr> |
566 | <tr><td class="h"><a name="396"></a>396</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
567 | <tr><td class="h"><a name="397"></a>397</td><td></td><td></td><td></td><td></td><td class="s"> # Standalone tags that aren't special cases. Currently only cb.</td></tr> |
568 | <tr><td class="h"><a name="398"></a>398</td><td></td><td></td><td></td><td></td><td class="s"> foreach my $tag ( qw( cb ) ) {</td></tr> |
569 | <tr><td class="h"><a name="399"></a>399</td><td></td><td></td><td></td><td></td><td class="s"> my $tag_sig = $sigils->{$tag}; </td></tr> |
570 | <tr><td class="h"><a name="400"></a>400</td><td></td><td></td><td></td><td></td><td class="s"> $line =~ s|\Q$tag_sig\E|"<$tag/>"|ge;</td></tr> |
571 | <tr><td class="h"><a name="401"></a>401</td><td></td><td></td><td></td><td></td><td class="s"> } </td></tr> |
572 | <tr><td class="h"><a name="402"></a>402</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
573 | <tr><td class="h"><a name="403"></a>403</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
574 | <tr><td class="h"><a name="404"></a>404</td><td></td><td></td><td></td><td></td><td class="s"> # Page breaks. Defined by the delimiters, plus an optional</td></tr> |
575 | <tr><td class="h"><a name="405"></a>405</td><td></td><td></td><td></td><td></td><td class="s"> # page/folio number & recto/verso indicator, on a line by itself.</td></tr> |
576 | <tr><td class="h"><a name="406"></a>406</td><td></td><td></td><td></td><td></td><td class="s"> # Of course other languages may use other sigils to indicate recto</td></tr> |
577 | <tr><td class="h"><a name="407"></a>407</td><td></td><td></td><td></td><td></td><td class="s"> # verso, so do not look for 'r' and 'v' specifically.</td></tr> |
578 | <tr><td class="h"><a name="408"></a>408</td><td></td><td></td><td></td><td></td><td class="s"> my $pb_sig = $sigils->{'pb'};</td></tr> |
579 | <tr><td class="h"><a name="409"></a>409</td><td></td><td></td><td></td><td></td><td class="s"> my ( $pb_open, $pb_close );</td></tr> |
580 | <tr><td class="h"><a name="410"></a>410</td><td></td><td></td><td></td><td></td><td class="s"> if( ref( $pb_sig ) eq 'ARRAY' ) {</td></tr> |
581 | <tr><td class="h"><a name="411"></a>411</td><td></td><td></td><td></td><td></td><td class="s"> ( $pb_open, $pb_close ) = @$pb_sig;</td></tr> |
582 | <tr><td class="h"><a name="412"></a>412</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
583 | <tr><td class="h"><a name="413"></a>413</td><td></td><td></td><td></td><td></td><td class="s"> $pb_open = $pb_sig;</td></tr> |
584 | <tr><td class="h"><a name="414"></a>414</td><td></td><td></td><td></td><td></td><td class="s"> $pb_close = $pb_sig;</td></tr> |
585 | <tr><td class="h"><a name="415"></a>415</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
586 | <tr><td class="h"><a name="416"></a>416</td><td></td><td></td><td></td><td></td><td class="s"> $line =~ s|^\Q$pb_open\E(\d+(.)?)\Q$pb_close\E\s*$|<pb n=\"$1\"/>|;</td></tr> |
587 | <tr><td class="h"><a name="417"></a>417</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
588 | <tr><td class="h"><a name="418"></a>418</td><td></td><td></td><td></td><td></td><td class="s"> # XML comments. Convert ## text ## to <!-- text --></td></tr> |
589 | <tr><td class="h"><a name="419"></a>419</td><td></td><td></td><td></td><td></td><td class="s"> my $com_sig = $sigils->{'comment'};</td></tr> |
590 | <tr><td class="h"><a name="420"></a>420</td><td></td><td></td><td></td><td></td><td class="s"> my ( $com_open, $com_close );</td></tr> |
591 | <tr><td class="h"><a name="421"></a>421</td><td></td><td></td><td></td><td></td><td class="s"> if( ref( $com_sig ) eq 'ARRAY' ) {</td></tr> |
592 | <tr><td class="h"><a name="422"></a>422</td><td></td><td></td><td></td><td></td><td class="s"> ( $com_open, $com_close ) = @$com_sig;</td></tr> |
593 | <tr><td class="h"><a name="423"></a>423</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
594 | <tr><td class="h"><a name="424"></a>424</td><td></td><td></td><td></td><td></td><td class="s"> $com_open = $com_close = $com_sig;</td></tr> |
595 | <tr><td class="h"><a name="425"></a>425</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
596 | <tr><td class="h"><a name="426"></a>426</td><td></td><td></td><td></td><td></td><td class="s"> $line =~ s|\Q$com_open\E(.*?)\Q$com_close\E|<!--$1-->|g;</td></tr> |
597 | <tr><td class="h"><a name="427"></a>427</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
598 | <tr><td class="h"><a name="428"></a>428</td><td></td><td></td><td></td><td></td><td class="s"> # Finally, every line with text outside an XML tag must have a line</td></tr> |
599 | <tr><td class="h"><a name="429"></a>429</td><td></td><td></td><td></td><td></td><td class="s"> # break. Any lb tag should be inside a cb, p, or div tag.</td></tr> |
600 | <tr><td class="h"><a name="430"></a>430</td><td></td><td></td><td></td><td></td><td class="s"> my $testline = $line;</td></tr> |
601 | <tr><td class="h"><a name="431"></a>431</td><td></td><td></td><td></td><td></td><td class="s"> $testline =~ s/<[^>]*>//g;</td></tr> |
602 | <tr><td class="h"><a name="432"></a>432</td><td></td><td></td><td></td><td></td><td class="s"> if( $testline =~ /\S/ ) {</td></tr> |
603 | <tr><td class="h"><a name="433"></a>433</td><td class="c3">2</td><td class="c0"><span title="Avg 446µs">892µs</span></td><td class="c3">2</td><td class="c3">41µs</td><td class="s"><div class="calls"><div class="calls_in"># spent 27µs (13+14) within Text::TEI::Markup::BEGIN@433 which was called: |
604 | # once (13µs+14µs) by Text::Tradition::Witness::BEGIN@7 at <a href="Text-TEI-Markup-pm-1183-line.html#433">line 433</a></div></div> no warnings 'uninitialized';<div class="calls"><div class="calls_out"> # spent 27µs making 1 call to <a href="Text-TEI-Markup-pm-1183-line.html#433">Text::TEI::Markup::BEGIN@433</a> |
605 | # spent 14µs making 1 call to <a href="warnings-pm-2-line.html#401">warnings::unimport</a></div></div></td></tr> |
606 | <tr><td class="h"><a name="434"></a>434</td><td></td><td></td><td></td><td></td><td class="s"> $line =~ s!(</p>|</div>|<cb/>)?$!<lb/>$1!;</td></tr> |
607 | <tr><td class="h"><a name="435"></a>435</td><td></td><td></td><td></td><td></td><td class="s"> } </td></tr> |
608 | <tr><td class="h"><a name="436"></a>436</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
609 | <tr><td class="h"><a name="437"></a>437</td><td></td><td></td><td></td><td></td><td class="s"> # Return the expanded line.</td></tr> |
610 | <tr><td class="h"><a name="438"></a>438</td><td></td><td></td><td></td><td></td><td class="s"> return( "$line\n", $in_div, $in_p );</td></tr> |
611 | <tr><td class="h"><a name="439"></a>439</td><td></td><td></td><td></td><td></td><td class="s">}</td></tr> |
612 | <tr><td class="h"><a name="440"></a>440</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
613 | <tr><td class="h"><a name="441"></a>441</td><td></td><td></td><td></td><td></td><td class="s">sub _open_tag {</td></tr> |
614 | <tr><td class="h"><a name="442"></a>442</td><td></td><td></td><td></td><td></td><td class="s"> my( $tag, $text, $opts ) = @_;</td></tr> |
615 | <tr><td class="h"><a name="443"></a>443</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
616 | <tr><td class="h"><a name="444"></a>444</td><td></td><td></td><td></td><td></td><td class="s"> my $opened_tag;</td></tr> |
617 | <tr><td class="h"><a name="445"></a>445</td><td></td><td></td><td></td><td></td><td class="s"> # Does the tag take a parenthesized argument?</td></tr> |
618 | <tr><td class="h"><a name="446"></a>446</td><td></td><td></td><td></td><td></td><td class="s"> my $arg = '';</td></tr> |
619 | <tr><td class="h"><a name="447"></a>447</td><td></td><td></td><td></td><td></td><td class="s"> if( $text =~ /^\(([^\)]+)\)(.*)$/ ) {</td></tr> |
620 | <tr><td class="h"><a name="448"></a>448</td><td></td><td></td><td></td><td></td><td class="s"> ( $arg, $text ) = ( $1, $2 );</td></tr> |
621 | <tr><td class="h"><a name="449"></a>449</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
622 | <tr><td class="h"><a name="450"></a>450</td><td></td><td></td><td></td><td></td><td class="s"> if( $tag =~ /^(ex|expan|supplied)$/ ) {</td></tr> |
623 | <tr><td class="h"><a name="451"></a>451</td><td></td><td></td><td></td><td></td><td class="s"> # It takes a resp agent.</td></tr> |
624 | <tr><td class="h"><a name="452"></a>452</td><td></td><td></td><td></td><td></td><td class="s"> $opened_tag = '<'. $tag .' resp="' . $opts->{'resp'} . "\">$text";</td></tr> |
625 | <tr><td class="h"><a name="453"></a>453</td><td></td><td></td><td></td><td></td><td class="s"> } elsif ( $tag eq 'q' ) {</td></tr> |
626 | <tr><td class="h"><a name="454"></a>454</td><td></td><td></td><td></td><td></td><td class="s"> # Special case - we mean a biblical quote.</td></tr> |
627 | <tr><td class="h"><a name="455"></a>455</td><td></td><td></td><td></td><td></td><td class="s"> $opened_tag = '<q type="biblical">' . $text;</td></tr> |
628 | <tr><td class="h"><a name="456"></a>456</td><td></td><td></td><td></td><td></td><td class="s"> } elsif ( $tag eq 'num' ) {</td></tr> |
629 | <tr><td class="h"><a name="457"></a>457</td><td></td><td></td><td></td><td></td><td class="s"> # Derive the number's value if requested.</td></tr> |
630 | <tr><td class="h"><a name="458"></a>458</td><td></td><td></td><td></td><td></td><td class="s"> my $numconvert = $opts->{'number_conversion'};</td></tr> |
631 | <tr><td class="h"><a name="459"></a>459</td><td></td><td></td><td></td><td></td><td class="s"> if( defined $numconvert ) {</td></tr> |
632 | <tr><td class="h"><a name="460"></a>460</td><td></td><td></td><td></td><td></td><td class="s"> my $nv = &$numconvert( $text );</td></tr> |
633 | <tr><td class="h"><a name="461"></a>461</td><td></td><td></td><td></td><td></td><td class="s"> $opened_tag = "<num value=\"$nv\">$text" if defined $nv;</td></tr> |
634 | <tr><td class="h"><a name="462"></a>462</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
635 | <tr><td class="h"><a name="463"></a>463</td><td></td><td></td><td></td><td></td><td class="s"> } elsif ( $tag eq 'hi' ) {</td></tr> |
636 | <tr><td class="h"><a name="464"></a>464</td><td></td><td></td><td></td><td></td><td class="s"> warn "Empty argument passed to $tag tag" unless $arg;</td></tr> |
637 | <tr><td class="h"><a name="465"></a>465</td><td></td><td></td><td></td><td></td><td class="s"> $opened_tag = sprintf( '<%s rend="%s">%s', $tag, $arg, $text );</td></tr> |
638 | <tr><td class="h"><a name="466"></a>466</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
639 | <tr><td class="h"><a name="467"></a>467</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
640 | <tr><td class="h"><a name="468"></a>468</td><td></td><td></td><td></td><td></td><td class="s"> # The default</td></tr> |
641 | <tr><td class="h"><a name="469"></a>469</td><td></td><td></td><td></td><td></td><td class="s"> $opened_tag = "<$tag>$text" unless $opened_tag;</td></tr> |
642 | <tr><td class="h"><a name="470"></a>470</td><td></td><td></td><td></td><td></td><td class="s"> return $opened_tag;</td></tr> |
643 | <tr><td class="h"><a name="471"></a>471</td><td></td><td></td><td></td><td></td><td class="s">}</td></tr> |
644 | <tr><td class="h"><a name="472"></a>472</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
645 | <tr><td class="h"><a name="473"></a>473</td><td></td><td></td><td></td><td></td><td class="s">=item B<word_tag_wrap>( $xml_string )</td></tr> |
646 | <tr><td class="h"><a name="474"></a>474</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
647 | <tr><td class="h"><a name="475"></a>475</td><td></td><td></td><td></td><td></td><td class="s">Takes a string containing a TEI XML document, and returns that</td></tr> |
648 | <tr><td class="h"><a name="476"></a>476</td><td></td><td></td><td></td><td></td><td class="s">document with all its words wrapped in <w/> (or <seg/>) tags. A</td></tr> |
649 | <tr><td class="h"><a name="477"></a>477</td><td></td><td></td><td></td><td></td><td class="s">"word" is defined as a series of text characters separated by</td></tr> |
650 | <tr><td class="h"><a name="478"></a>478</td><td></td><td></td><td></td><td></td><td class="s">whitespace. A word can have a line break, or even a page break, in</td></tr> |
651 | <tr><td class="h"><a name="479"></a>479</td><td></td><td></td><td></td><td></td><td class="s">the middle; if this is the case, there I<may not> be any whitespace</td></tr> |
652 | <tr><td class="h"><a name="480"></a>480</td><td></td><td></td><td></td><td></td><td class="s">between the end of the first word segment and the <lb/> (or <pb/>)</td></tr> |
653 | <tr><td class="h"><a name="481"></a>481</td><td></td><td></td><td></td><td></td><td class="s">tag. Conversely, there I<must> be whitespace separating the <lb/> (or</td></tr> |
654 | <tr><td class="h"><a name="482"></a>482</td><td></td><td></td><td></td><td></td><td class="s"><pb/>) from a complete word.</td></tr> |
655 | <tr><td class="h"><a name="483"></a>483</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
656 | <tr><td class="h"><a name="484"></a>484</td><td></td><td></td><td></td><td></td><td class="s">=cut</td></tr> |
657 | <tr><td class="h"><a name="485"></a>485</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
658 | <tr><td class="h"><a name="486"></a>486</td><td></td><td></td><td></td><td></td><td class="s">sub word_tag_wrap {</td></tr> |
659 | <tr><td class="h"><a name="487"></a>487</td><td></td><td></td><td></td><td></td><td class="s"> my( $xml, $format ) = @_;</td></tr> |
660 | <tr><td class="h"><a name="488"></a>488</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
661 | <tr><td class="h"><a name="489"></a>489</td><td></td><td></td><td></td><td></td><td class="s"> my $ret;</td></tr> |
662 | <tr><td class="h"><a name="490"></a>490</td><td></td><td></td><td></td><td></td><td class="s"> my $doc;</td></tr> |
663 | <tr><td class="h"><a name="491"></a>491</td><td></td><td></td><td></td><td></td><td class="s"> my $root;</td></tr> |
664 | <tr><td class="h"><a name="492"></a>492</td><td></td><td></td><td></td><td></td><td class="s"> if( !ref( $xml ) ) {</td></tr> |
665 | <tr><td class="h"><a name="493"></a>493</td><td></td><td></td><td></td><td></td><td class="s"> $ret = 'string';</td></tr> |
666 | <tr><td class="h"><a name="494"></a>494</td><td></td><td></td><td></td><td></td><td class="s"> my $parser = XML::LibXML->new();</td></tr> |
667 | <tr><td class="h"><a name="495"></a>495</td><td></td><td></td><td></td><td></td><td class="s"> $doc = $parser->parse_string( $xml );</td></tr> |
668 | <tr><td class="h"><a name="496"></a>496</td><td></td><td></td><td></td><td></td><td class="s"> $root = $doc->getDocumentElement();</td></tr> |
669 | <tr><td class="h"><a name="497"></a>497</td><td></td><td></td><td></td><td></td><td class="s"> } elsif( ref( $xml ) eq 'XML::LibXML::Document' ) {</td></tr> |
670 | <tr><td class="h"><a name="498"></a>498</td><td></td><td></td><td></td><td></td><td class="s"> $ret = 'xml';</td></tr> |
671 | <tr><td class="h"><a name="499"></a>499</td><td></td><td></td><td></td><td></td><td class="s"> $root = $xml->getDocumentElement();</td></tr> |
672 | <tr><td class="h"><a name="500"></a>500</td><td></td><td></td><td></td><td></td><td class="s"> } elsif( ref( $xml ) eq 'XML::LibXML::Element' ) {</td></tr> |
673 | <tr><td class="h"><a name="501"></a>501</td><td></td><td></td><td></td><td></td><td class="s"> $ret = 'xml';</td></tr> |
674 | <tr><td class="h"><a name="502"></a>502</td><td></td><td></td><td></td><td></td><td class="s"> $root = $xml;</td></tr> |
675 | <tr><td class="h"><a name="503"></a>503</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
676 | <tr><td class="h"><a name="504"></a>504</td><td></td><td></td><td></td><td></td><td class="s"> die "Passed argument is neither string, Document, or Element";</td></tr> |
677 | <tr><td class="h"><a name="505"></a>505</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
678 | <tr><td class="h"><a name="506"></a>506</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
679 | <tr><td class="h"><a name="507"></a>507</td><td></td><td></td><td></td><td></td><td class="s"> my @textnodes = $root->getElementsByTagName( 'text' );</td></tr> |
680 | <tr><td class="h"><a name="508"></a>508</td><td></td><td></td><td></td><td></td><td class="s"> my %paragraphs; # Cope with the fact that text nodes can be recursive</td></tr> |
681 | <tr><td class="h"><a name="509"></a>509</td><td></td><td></td><td></td><td></td><td class="s"> foreach my $t ( @textnodes ) {</td></tr> |
682 | <tr><td class="h"><a name="510"></a>510</td><td></td><td></td><td></td><td></td><td class="s"> map { $paragraphs{Scalar::Util::refaddr( $_ )} = $_ } $t->getElementsByTagName( 'p' );</td></tr> |
683 | <tr><td class="h"><a name="511"></a>511</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
684 | <tr><td class="h"><a name="512"></a>512</td><td></td><td></td><td></td><td></td><td class="s"> foreach my $p ( values %paragraphs ) {</td></tr> |
685 | <tr><td class="h"><a name="513"></a>513</td><td></td><td></td><td></td><td></td><td class="s"> my $new_p = _wrap_children( $p );</td></tr> |
686 | <tr><td class="h"><a name="514"></a>514</td><td></td><td></td><td></td><td></td><td class="s"> $p->replaceNode( $new_p );</td></tr> |
687 | <tr><td class="h"><a name="515"></a>515</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
688 | <tr><td class="h"><a name="516"></a>516</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
689 | <tr><td class="h"><a name="517"></a>517</td><td></td><td></td><td></td><td></td><td class="s"> # Annoyingly, we have to decode the encoding that takes place when</td></tr> |
690 | <tr><td class="h"><a name="518"></a>518</td><td></td><td></td><td></td><td></td><td class="s"> # the string is returned.</td></tr> |
691 | <tr><td class="h"><a name="519"></a>519</td><td></td><td></td><td></td><td></td><td class="s"> if( $ret eq 'string' ) {</td></tr> |
692 | <tr><td class="h"><a name="520"></a>520</td><td></td><td></td><td></td><td></td><td class="s"> $format = 0 unless $format;</td></tr> |
693 | <tr><td class="h"><a name="521"></a>521</td><td></td><td></td><td></td><td></td><td class="s"> return decode( $doc->encoding(), $doc->serialize( $format ) );</td></tr> |
694 | <tr><td class="h"><a name="522"></a>522</td><td></td><td></td><td></td><td></td><td class="s"> } # else the doc has been modified and we need return nothing.</td></tr> |
695 | <tr><td class="h"><a name="523"></a>523</td><td></td><td></td><td></td><td></td><td class="s">}</td></tr> |
696 | <tr><td class="h"><a name="524"></a>524</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
697 | <tr><td class="h"><a name="525"></a>525</td><td></td><td></td><td></td><td></td><td class="s">sub _wrap_children {</td></tr> |
698 | <tr><td class="h"><a name="526"></a>526</td><td></td><td></td><td></td><td></td><td class="s"> my $node = shift;</td></tr> |
699 | <tr><td class="h"><a name="527"></a>527</td><td></td><td></td><td></td><td></td><td class="s"> my @children = $node->childNodes;</td></tr> |
700 | <tr><td class="h"><a name="528"></a>528</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
701 | <tr><td class="h"><a name="529"></a>529</td><td></td><td></td><td></td><td></td><td class="s"> my $new_node = XML::LibXML::Element->new( $node->nodeName );</td></tr> |
702 | <tr><td class="h"><a name="530"></a>530</td><td></td><td></td><td></td><td></td><td class="s"> # Set the namespace</td></tr> |
703 | <tr><td class="h"><a name="531"></a>531</td><td></td><td></td><td></td><td></td><td class="s"> my $docns = $node->namespaceURI;</td></tr> |
704 | <tr><td class="h"><a name="532"></a>532</td><td></td><td></td><td></td><td></td><td class="s"> $new_node->setNamespace( $docns );</td></tr> |
705 | <tr><td class="h"><a name="533"></a>533</td><td></td><td></td><td></td><td></td><td class="s"> my $open_word_node = undef;</td></tr> |
706 | <tr><td class="h"><a name="534"></a>534</td><td></td><td></td><td></td><td></td><td class="s"> foreach my $c ( @children ) {</td></tr> |
707 | <tr><td class="h"><a name="535"></a>535</td><td></td><td></td><td></td><td></td><td class="s"> # Is it a text node?</td></tr> |
708 | <tr><td class="h"><a name="536"></a>536</td><td></td><td></td><td></td><td></td><td class="s"> if( ref( $c ) eq 'XML::LibXML::Text' ) {</td></tr> |
709 | <tr><td class="h"><a name="537"></a>537</td><td></td><td></td><td></td><td></td><td class="s"> # Get the text.</td></tr> |
710 | <tr><td class="h"><a name="538"></a>538</td><td></td><td></td><td></td><td></td><td class="s"> my $str = $c->textContent;</td></tr> |
711 | <tr><td class="h"><a name="539"></a>539</td><td></td><td></td><td></td><td></td><td class="s"> # Strip out carriage returns and their surrounding spaces.</td></tr> |
712 | <tr><td class="h"><a name="540"></a>540</td><td></td><td></td><td></td><td></td><td class="s"> # Carriage returns should only occur after &lt;lb/&gt; elements,</td></tr> |
713 | <tr><td class="h"><a name="541"></a>541</td><td></td><td></td><td></td><td></td><td class="s"> # and the spaces around them should therefore be insignificant.</td></tr> |
714 | <tr><td class="h"><a name="542"></a>542</td><td></td><td></td><td></td><td></td><td class="s"> $str =~ s/^\s*\n\s*//gs;</td></tr> |
715 | <tr><td class="h"><a name="543"></a>543</td><td></td><td></td><td></td><td></td><td class="s"> # If there is nothing at all but a newline + initial spaces,</td></tr> |
716 | <tr><td class="h"><a name="544"></a>544</td><td></td><td></td><td></td><td></td><td class="s"> # pretend that the node isn't there at all.</td></tr> |
717 | <tr><td class="h"><a name="545"></a>545</td><td></td><td></td><td></td><td></td><td class="s"> next unless $str;</td></tr> |
718 | <tr><td class="h"><a name="546"></a>546</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
719 | <tr><td class="h"><a name="547"></a>547</td><td></td><td></td><td></td><td></td><td class="s"> # Get the individual words.</td></tr> |
720 | <tr><td class="h"><a name="548"></a>548</td><td></td><td></td><td></td><td></td><td class="s"> my @words = split( /\s+/, $str );</td></tr> |
721 | <tr><td class="h"><a name="549"></a>549</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
722 | <tr><td class="h"><a name="550"></a>550</td><td></td><td></td><td></td><td></td><td class="s"> # Finish out the last word if we need to.</td></tr> |
723 | <tr><td class="h"><a name="551"></a>551</td><td></td><td></td><td></td><td></td><td class="s"> if( $open_word_node ) {</td></tr> |
724 | <tr><td class="h"><a name="552"></a>552</td><td></td><td></td><td></td><td></td><td class="s"> # If there are any words in this text string, the</td></tr> |
725 | <tr><td class="h"><a name="553"></a>553</td><td></td><td></td><td></td><td></td><td class="s"> # first one should be used to close out the open node.</td></tr> |
726 | <tr><td class="h"><a name="554"></a>554</td><td></td><td></td><td></td><td></td><td class="s"> # If the first word is empty, it's a space and the</td></tr> |
727 | <tr><td class="h"><a name="555"></a>555</td><td></td><td></td><td></td><td></td><td class="s"> # word should just be closed. If there are no words</td></tr> |
728 | <tr><td class="h"><a name="556"></a>556</td><td></td><td></td><td></td><td></td><td class="s"> # at all, it was just a space. If the first word was</td></tr> |
729 | <tr><td class="h"><a name="557"></a>557</td><td></td><td></td><td></td><td></td><td class="s"> # all there is, we haven't encountered a space yet and</td></tr> |
730 | <tr><td class="h"><a name="558"></a>558</td><td></td><td></td><td></td><td></td><td class="s"> # need to keep the word open.</td></tr> |
731 | <tr><td class="h"><a name="559"></a>559</td><td></td><td></td><td></td><td></td><td class="s"> if( @words ) {</td></tr> |
732 | <tr><td class="h"><a name="560"></a>560</td><td></td><td></td><td></td><td></td><td class="s"> my $first = shift @words;</td></tr> |
733 | <tr><td class="h"><a name="561"></a>561</td><td></td><td></td><td></td><td></td><td class="s"> $open_word_node->appendText( $first ) if $first;</td></tr> |
734 | <tr><td class="h"><a name="562"></a>562</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
735 | <tr><td class="h"><a name="563"></a>563</td><td></td><td></td><td></td><td></td><td class="s"> $open_word_node = undef unless @words;</td></tr> |
736 | <tr><td class="h"><a name="564"></a>564</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
737 | <tr><td class="h"><a name="565"></a>565</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
738 | <tr><td class="h"><a name="566"></a>566</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
739 | <tr><td class="h"><a name="567"></a>567</td><td></td><td></td><td></td><td></td><td class="s"> foreach( @words ) {</td></tr> |
740 | <tr><td class="h"><a name="568"></a>568</td><td></td><td></td><td></td><td></td><td class="s"> # Skip whitespace "words"</td></tr> |
741 | <tr><td class="h"><a name="569"></a>569</td><td></td><td></td><td></td><td></td><td class="s"> next unless /\S/;</td></tr> |
742 | <tr><td class="h"><a name="570"></a>570</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
743 | <tr><td class="h"><a name="571"></a>571</td><td></td><td></td><td></td><td></td><td class="s"> # Make a new node for the word</td></tr> |
744 | <tr><td class="h"><a name="572"></a>572</td><td></td><td></td><td></td><td></td><td class="s"> my $word_node = XML::LibXML::Element->new( 'w' );</td></tr> |
745 | <tr><td class="h"><a name="573"></a>573</td><td></td><td></td><td></td><td></td><td class="s"> $word_node->setNamespace( $docns );</td></tr> |
746 | <tr><td class="h"><a name="574"></a>574</td><td></td><td></td><td></td><td></td><td class="s"> $word_node->appendText( $_ );</td></tr> |
747 | <tr><td class="h"><a name="575"></a>575</td><td></td><td></td><td></td><td></td><td class="s"> $new_node->appendChild( $word_node );</td></tr> |
748 | <tr><td class="h"><a name="576"></a>576</td><td></td><td></td><td></td><td></td><td class="s"> # ...and keep it open until we find a new word or a space</td></tr> |
749 | <tr><td class="h"><a name="577"></a>577</td><td></td><td></td><td></td><td></td><td class="s"> $open_word_node = $word_node;</td></tr> |
750 | <tr><td class="h"><a name="578"></a>578</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
751 | <tr><td class="h"><a name="579"></a>579</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
752 | <tr><td class="h"><a name="580"></a>580</td><td></td><td></td><td></td><td></td><td class="s"> # Close the last word node if our text node ends in a space.</td></tr> |
753 | <tr><td class="h"><a name="581"></a>581</td><td></td><td></td><td></td><td></td><td class="s"> if( $str =~ /\s+$/s ) {</td></tr> |
754 | <tr><td class="h"><a name="582"></a>582</td><td></td><td></td><td></td><td></td><td class="s"> $open_word_node = undef;</td></tr> |
755 | <tr><td class="h"><a name="583"></a>583</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
756 | <tr><td class="h"><a name="584"></a>584</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
757 | <tr><td class="h"><a name="585"></a>585</td><td></td><td></td><td></td><td></td><td class="s"> my $wrapped_child;</td></tr> |
758 | <tr><td class="h"><a name="586"></a>586</td><td></td><td></td><td></td><td></td><td class="s"> if ( ref( $c ) ne 'XML::LibXML::Comment' && $c->textContent ne ''</td></tr> |
759 | <tr><td class="h"><a name="587"></a>587</td><td></td><td></td><td></td><td></td><td class="s"> && $c->textContent =~ /\s+/ ) {</td></tr> |
760 | <tr><td class="h"><a name="588"></a>588</td><td></td><td></td><td></td><td></td><td class="s"> # Recurse on any node that itself contains whitespace-separated text.</td></tr> |
761 | <tr><td class="h"><a name="589"></a>589</td><td></td><td></td><td></td><td></td><td class="s"> my $new_c = _wrap_children( $c );</td></tr> |
762 | <tr><td class="h"><a name="590"></a>590</td><td></td><td></td><td></td><td></td><td class="s"> $wrapped_child = ( $c->toString() ne $new_c->toString() );</td></tr> |
763 | <tr><td class="h"><a name="591"></a>591</td><td></td><td></td><td></td><td></td><td class="s"> $c = $new_c;</td></tr> |
764 | <tr><td class="h"><a name="592"></a>592</td><td></td><td></td><td></td><td></td><td class="s"> } </td></tr> |
765 | <tr><td class="h"><a name="593"></a>593</td><td></td><td></td><td></td><td></td><td class="s"> </td></tr> |
766 | <tr><td class="h"><a name="594"></a>594</td><td></td><td></td><td></td><td></td><td class="s"> # If there is an open word node, make it a seg and append</td></tr> |
767 | <tr><td class="h"><a name="595"></a>595</td><td></td><td></td><td></td><td></td><td class="s"> # our result there; if the child has text content but no</td></tr> |
768 | <tr><td class="h"><a name="596"></a>596</td><td></td><td></td><td></td><td></td><td class="s"> # word children, wrap it in a new seg; otherwise just pass</td></tr> |
769 | <tr><td class="h"><a name="597"></a>597</td><td></td><td></td><td></td><td></td><td class="s"> # it on through.</td></tr> |
770 | <tr><td class="h"><a name="598"></a>598</td><td></td><td></td><td></td><td></td><td class="s"> if( $open_word_node ) {</td></tr> |
771 | <tr><td class="h"><a name="599"></a>599</td><td></td><td></td><td></td><td></td><td class="s"> $open_word_node->setNodeName( 'seg' );</td></tr> |
772 | <tr><td class="h"><a name="600"></a>600</td><td></td><td></td><td></td><td></td><td class="s"> $open_word_node->setAttribute( 'type', 'word' );</td></tr> |
773 | <tr><td class="h"><a name="601"></a>601</td><td></td><td></td><td></td><td></td><td class="s"> $open_word_node->appendChild( $c );</td></tr> |
774 | <tr><td class="h"><a name="602"></a>602</td><td></td><td></td><td></td><td></td><td class="s"> } elsif( ref( $c ) eq 'XML::LibXML::Comment' || $c->textContent eq '' </td></tr> |
775 | <tr><td class="h"><a name="603"></a>603</td><td></td><td></td><td></td><td></td><td class="s"> || $wrapped_child ) {</td></tr> |
776 | <tr><td class="h"><a name="604"></a>604</td><td></td><td></td><td></td><td></td><td class="s"> $new_node->appendChild( $c );</td></tr> |
777 | <tr><td class="h"><a name="605"></a>605</td><td></td><td></td><td></td><td></td><td class="s"> } else {</td></tr> |
778 | <tr><td class="h"><a name="606"></a>606</td><td></td><td></td><td></td><td></td><td class="s"> my $segment_node = XML::LibXML::Element->new( 'seg' );</td></tr> |
779 | <tr><td class="h"><a name="607"></a>607</td><td></td><td></td><td></td><td></td><td class="s"> $segment_node->setNamespace( $docns );</td></tr> |
780 | <tr><td class="h"><a name="608"></a>608</td><td></td><td></td><td></td><td></td><td class="s"> $segment_node->setAttribute( 'type', 'word' );</td></tr> |
781 | <tr><td class="h"><a name="609"></a>609</td><td></td><td></td><td></td><td></td><td class="s"> $segment_node->appendChild( $c );</td></tr> |
782 | <tr><td class="h"><a name="610"></a>610</td><td></td><td></td><td></td><td></td><td class="s"> $new_node->appendChild( $segment_node );</td></tr> |
783 | <tr><td class="h"><a name="611"></a>611</td><td></td><td></td><td></td><td></td><td class="s"> # Keep it open in case there is not a leading space on the next</td></tr> |
784 | <tr><td class="h"><a name="612"></a>612</td><td></td><td></td><td></td><td></td><td class="s"> # text node.</td></tr> |
785 | <tr><td class="h"><a name="613"></a>613</td><td></td><td></td><td></td><td></td><td class="s"> $open_word_node = $segment_node;</td></tr> |
786 | <tr><td class="h"><a name="614"></a>614</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
787 | <tr><td class="h"><a name="615"></a>615</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
788 | <tr><td class="h"><a name="616"></a>616</td><td></td><td></td><td></td><td></td><td class="s"> }</td></tr> |
789 | <tr><td class="h"><a name="617"></a>617</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
790 | <tr><td class="h"><a name="618"></a>618</td><td></td><td></td><td></td><td></td><td class="s"> return $new_node; </td></tr> |
791 | <tr><td class="h"><a name="619"></a>619</td><td></td><td></td><td></td><td></td><td class="s">}</td></tr> |
792 | <tr><td class="h"><a name="620"></a>620</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
793 | <tr><td class="h"><a name="621"></a>621</td><td></td><td></td><td></td><td></td><td class="s">=back</td></tr> |
794 | <tr><td class="h"><a name="622"></a>622</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
795 | <tr><td class="h"><a name="623"></a>623</td><td></td><td></td><td></td><td></td><td class="s">=head1 BUGS / TODO</td></tr> |
796 | <tr><td class="h"><a name="624"></a>624</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
797 | <tr><td class="h"><a name="625"></a>625</td><td></td><td></td><td></td><td></td><td class="s">The XML is not currently validated against a schema. This is mostly</td></tr> |
798 | <tr><td class="h"><a name="626"></a>626</td><td></td><td></td><td></td><td></td><td class="s">because I have been unable to get RelaxNG validation to work against</td></tr> |
799 | <tr><td class="h"><a name="627"></a>627</td><td></td><td></td><td></td><td></td><td class="s">certain TEI schemas.</td></tr> |
800 | <tr><td class="h"><a name="628"></a>628</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
801 | <tr><td class="h"><a name="629"></a>629</td><td></td><td></td><td></td><td></td><td class="s">This module is currently in a state that I know to be useful to me.</td></tr> |
802 | <tr><td class="h"><a name="630"></a>630</td><td></td><td></td><td></td><td></td><td class="s">If it looks like it might be useful to you, but something is bugging</td></tr> |
803 | <tr><td class="h"><a name="631"></a>631</td><td></td><td></td><td></td><td></td><td class="s">you about it, report it!</td></tr> |
804 | <tr><td class="h"><a name="632"></a>632</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
805 | <tr><td class="h"><a name="633"></a>633</td><td></td><td></td><td></td><td></td><td class="s">=head1 LICENSE</td></tr> |
806 | <tr><td class="h"><a name="634"></a>634</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
807 | <tr><td class="h"><a name="635"></a>635</td><td></td><td></td><td></td><td></td><td class="s">This package is free software and is provided "as is" without express</td></tr> |
808 | <tr><td class="h"><a name="636"></a>636</td><td></td><td></td><td></td><td></td><td class="s">or implied warranty. You can redistribute it and/or modify it under</td></tr> |
809 | <tr><td class="h"><a name="637"></a>637</td><td></td><td></td><td></td><td></td><td class="s">the same terms as Perl itself.</td></tr> |
810 | <tr><td class="h"><a name="638"></a>638</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
811 | <tr><td class="h"><a name="639"></a>639</td><td></td><td></td><td></td><td></td><td class="s">=head1 AUTHOR</td></tr> |
812 | <tr><td class="h"><a name="640"></a>640</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
813 | <tr><td class="h"><a name="641"></a>641</td><td></td><td></td><td></td><td></td><td class="s">Tara L Andrews, L&lt;aurum@cpan.org&gt;</td></tr> |
814 | <tr><td class="h"><a name="642"></a>642</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
815 | <tr><td class="h"><a name="643"></a>643</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
816 | <tr><td class="h"><a name="644"></a>644</td><td></td><td></td><td></td><td></td><td class="s">=cut</td></tr> |
817 | <tr><td class="h"><a name="645"></a>645</td><td></td><td></td><td></td><td></td><td class="s"></td></tr> |
818 | <tr><td class="h"><a name="646"></a>646</td><td></td><td></td><td></td><td></td><td class="s">__DATA__</td></tr> |
819 | </tbody></table></div> |
820 | |
821 | <script type="text/javascript"> $(document).ready(function() { |
822 | |
823 | $("#subs_table").tablesorter({ |
824 | sortList: [[3,1]], |
825 | headers: { |
826 | 3: { sorter: 'fmt_time' }, |
827 | 4: { sorter: 'fmt_time' } |
828 | } |
829 | }); |
830 | |
831 | } ); </script> |
832 | |
833 | <div class="footer">Report produced by the |
834 | <a href="http://search.cpan.org/dist/Devel-NYTProf/">NYTProf 4.06</a> |
835 | Perl profiler, developed by |
836 | <a href="http://www.linkedin.com/in/timbunce">Tim Bunce</a> and |
837 | <a href="http://code.nytimes.com">Adam Kaplan</a>. |
838 | </div> |
839 | <br /><br /><br /><br /><br /><br /><br /><br /><br /><br /> |
840 | </body></html> |