Commit | Line | Data |
d63bcdae |
1 | package Web::Dispatch::Parser; |
920d6222 |
2 | |
a5917caa |
# Compile-time debug switch.
#
# DEBUG is installed as a constant sub with an empty prototype: it yields 1
# when the WEB_DISPATCH_PARSER_DEBUG environment variable is true at compile
# time and 0 otherwise. Installing it inside BEGIN makes it available to the
# code compiled later in this file.
BEGIN {
  *DEBUG = $ENV{WEB_DISPATCH_PARSER_DEBUG}
    ? sub () { 1 }
    : sub () { 0 };
}
11 | |
d63bcdae |
12 | use Sub::Quote; |
13 | use Web::Dispatch::Predicates; |
14 | use Moo; |
15 | |
# Cache used by parse(): maps a whitespace-stripped spec string to the value
# _parse_spec returned for it. Built lazily as an empty hashref.
has _cache => (
  is      => 'lazy',
  default => quote_sub(q{ {} }),
);
a5917caa |
19 | |
d63bcdae |
# Emit the first argument through warn, but only when DEBUG is enabled.
sub diag {
  return unless DEBUG;
  warn $_[0];
}
920d6222 |
21 | |
# Die with a parse error about the dispatch spec currently held in $_.
#
# $error is the human-readable reason. The message shows the spec and, on the
# line below it, a caret indented by pos($_) columns (0 when no match
# position is set) to mark where parsing stopped. The message ends in a
# newline, so die does not append file/line information.
sub _blam {
  my ($self, $error) = @_;
  my $offset = pos($_) || 0;
  my $hat    = (' ' x $offset) . '^';
  die "Error parsing dispatch specification: ${error}\n\n"
    . "${_}\n"
    . "${hat} here\n";
}
29 | |
d63bcdae |
# Public entry point: turn a dispatch spec string into a matcher.
#
# All whitespace is removed from $spec first (it is not valid in a spec), and
# the stripped string is used as the cache key. A cached true value is
# returned as-is; otherwise the spec is handed to _parse_spec and the result
# is stored in the cache before being returned.
sub parse {
  my ($self, $spec) = @_;
  $spec =~ s/\s+//g;
  my $cache = $self->_cache;
  $cache->{$spec} ||= $self->_parse_spec($spec);
  return $cache->{$spec};
}
35 | |
# Parse a run of sections joined by combinators, starting at the current
# match position of the spec string.
#
# The spec is read through $_[1] (aliased to $_) rather than through a copy,
# so the position advanced by the \G matches is shared with the caller.
# $nested is false at top level; for a parenthesised group the caller passes
# the position just after the opening "(", which is used below to point the
# error caret back at that paren.
#
# Returns the single matcher when exactly one section was collected,
# otherwise match_and() over all of them. Dies via _blam on malformed input.
sub _parse_spec {
  my ($self, undef, $nested) = @_;
  for ($_[1]) {
    my @match;
    my $closed = 0;   # set once this group's ")" has been consumed
    PARSE: { do {
      # push returns the new size of @match, so this guard can only fire
      # while nothing has been collected yet.
      push @match, $self->_parse_spec_section($_)
        or $self->_blam("Unable to work out what the next section is");
      if (/\G\)/gc) {
        $self->_blam("Found closing ) with no opening (") unless $nested;
        $closed = 1;
        last PARSE;
      }
      last PARSE if pos($_) == length($_);
      $match[-1] = $self->_parse_spec_combinator($_, $match[-1])
        or $self->_blam('No valid combinator - expected + or |');
    } until (pos($_) == length($_)) };
    # Report an unclosed group only when the end of the spec was reached
    # without consuming a ")". A group whose ")" is the very last character
    # also finishes with pos == length and must not be rejected.
    if ($nested and not $closed and pos($_) == length($_)) {
      pos($_) = $nested - 1;
      $self->_blam("No closing ) found for opening (");
    }
    return $match[0] if @match == 1;
    return match_and(@match);
  }
}
59 | |
9b9866ae |
# Consume the combinator at the current position of the spec ($_[1]).
#
#   "+"  returns $match unchanged; the caller collects the sections on both
#        sides and combines them itself.
#   "|"  gathers further sections for as long as they are joined by "|" and
#        returns match_or() over $match plus those sections.
#
# Returns an empty list / undef when neither combinator is present.
sub _parse_spec_combinator {
  my ($self, $spec, $match) = @_;
  for ($_[1]) {
    return $match if /\G\+/gc;
    last unless /\G\|/gc;

    my @alternatives = ($match);
    while (1) {
      # push returns the new element count, which is never zero here because
      # @alternatives starts out holding $match.
      push @alternatives, $self->_parse_spec_section($_)
        or $self->_blam("Unable to work out what the next section is");
      last if pos($_) == length($_);
      last unless /\G\|/gc;          # stop when the next thing isn't |
      last if pos($_) == length($_);
    }
    return match_or(@alternatives);
  }
  return;
}
81 | |
920d6222 |
# Parse one section at the current position of the spec ($_[1]) and return
# its matcher. The alternatives are tried in the order listed; the first
# pattern that matches decides the outcome. Returns nothing when no
# alternative applies, leaving the caller to raise the error.
sub _parse_spec_section {
  my ($self) = @_;
  for ($_[1]) {

    # GET POST PUT HEAD ... -> HTTP method match
    if (/\G([A-Z]+)/gc) {
      return match_method($1);
    }

    # /... -> path match (the slash is only peeked at, not consumed)
    if (/\G(?=\/)/gc) {
      return $self->_url_path_match($_);
    }

    # .* and .html -> extension match
    if (/\G\.(\*|\w+)/gc) {
      return match_extension($1);
    }

    # (...) -> nested spec; pass the position just after the "("
    if (/\G\(/gc) {
      return $self->_parse_spec($_, pos($_));
    }

    # !something -> negation of the following section
    if (/\G!/gc) {
      return match_not($self->_parse_spec_section($_));
    }

    # ?<param spec> -> query parameters
    if (/\G\?/gc) {
      return $self->_parse_param_handler($_, 'query');
    }

    # %<param spec> -> body parameters
    if (/\G\%/gc) {
      return $self->_parse_param_handler($_, 'body');
    }
  }
  return; # () will trigger the blam in our caller
}
121 | |
920d6222 |
# Parse a path spec at the current position of the spec ($_[1]) and return a
# path matcher.
#
# Each "/" introduces one segment, translated to a regex fragment by
# _url_path_segment_match. A segment of "..." ends the path and switches to
# match_path_strip with a trailing '(/.*)' capture. Otherwise the last
# segment, when non-empty, additionally tolerates a ".ext" suffix and the
# result is built with match_path.
sub _url_path_match {
  my ($self) = @_;
  for ($_[1]) {
    my @segments;
    my $tail = '';
    while (/\G\//gc) {
      if (/\G\.\.\./gc) {
        $tail = '(/.*)';
        last;
      }
      # push returns the new size of @segments, so this guard can only fire
      # while no segment has been collected yet.
      push @segments, $self->_url_path_segment_match($_)
        or $self->_blam("Couldn't parse path match segment");
    }

    if (@segments and not $tail and length($segments[-1])) {
      $segments[-1] .= '(?:\.\w+)?';
    }

    my $pattern = '^(' . join('/', '', @segments) . ')' . $tail . '$';
    my $re      = qr/$pattern/;
    return $tail ? match_path_strip($re) : match_path($re);
  }
  return;
}
149 | |
# Translate the path segment at the current position of the spec ($_[1]) into
# a regex fragment. Returns an empty list when the segment is not recognised.
sub _url_path_segment_match {
  my ($self) = @_;
  for ($_[1]) {
    # nothing before end of spec / "+" / "|" / ")" -> empty segment, i.e. the
    # path spec ended in "/" and the URL must end in "/" too
    return '' if /\G(?:(?=[+|\)])|$)/gc;

    # word characters and "-" only -> exact path part match
    return "\Q$1" if /\G([\w\-]+)/gc;

    # ** -> capture unlimited path parts
    return '(.*?[^/])' if /\G\*\*/gc;

    # * -> capture a single path part
    return '([^/]+?)' if /\G\*/gc;
  }
  return ();
}
168 | |
9b9866ae |
# Parse a parameter spec (the text following "?" or "%") at the current
# position of the spec ($_[1]) and build a handler for it.
#
# $type selects the unpacker: the function named get_unpacked_${type}_from is
# looked up in Web::Simple::ParamParser.
#
# Each "&"-separated entry is one of, as implemented below:
#   [:][@]name=   parameter that is also recorded under 'required'
#   [:][@]name~   parameter that is not recorded under 'required'
#   [@]*          catch-all, stored under 'star'; at most one is allowed
# A leading ":" files the parameter under 'named' instead of 'positional';
# "@" sets its 'multi' flag. Note the order: ":" is read before "@".
#
# Returns a coderef that unpacks the raw parameters from its first argument
# and hands them, together with the collected spec, to
# Web::Dispatch::Predicates::_extract_params. Dies via _blam on bad syntax.
sub _parse_param_handler {
  my ($self, undef, $type) = @_;

  require Web::Simple::ParamParser;
  my $unpacker = Web::Simple::ParamParser->can("get_unpacked_${type}_from");

  for ($_[1]) {
    my %spec;
    do {

      # ?:foo or ?:@foo
      my $is_kw = /\G\:/gc;

      # ?@foo or ?@*
      my $multi = /\G\@/gc;

      # @* or *
      if (/\G\*/gc) {

        $self->_blam("* is always named; no need to supply :") if $is_kw;

        # The catch-all is tracked in %spec, so that is what must be tested
        # to detect a second * or @*.
        $self->_blam("Can only use one * or \@* in a parameter match")
          if $spec{star};

        $spec{star} = { multi => $multi };
      }
      else {

        # @foo= or foo= or @foo~ or foo~
        /\G(\w+)/gc or $self->_blam('Expected parameter name');
        my $name = $1;

        # check for = or ~ on the end
        if (/\G\=/gc) {
          push @{ $spec{required} ||= [] }, $name;
        }
        elsif (!/\G\~/gc) {
          $self->_blam('Expected = or ~ after parameter name');
        }

        # record positional or keyword
        push @{ $spec{ $is_kw ? 'named' : 'positional' } ||= [] },
          { name => $name, multi => $multi };
      }
    } while (/\G\&/gc);

    return sub {
      my $raw = $unpacker->($_[0]);
      Web::Dispatch::Predicates::_extract_params($raw, \%spec);
    };
  }
}
227 | |
920d6222 |
228 | 1; |