Commit | Line | Data |
b2e1304d |
1 | package HTTP::Request::AsCGI; |
f1dd0792 |
2 | # ABSTRACT: Set up a CGI environment from an HTTP::Request |
b2e1304d |
3 | use strict; |
4 | use warnings; |
090cc060 |
5 | use bytes; |
b2e1304d |
6 | use base 'Class::Accessor::Fast'; |
7 | |
362ea9ac |
8 | our $VERSION = '1.1'; |
8596f5a5 |
9 | |
b332ee65 |
10 | use Carp; |
11 | use HTTP::Response; |
12 | use IO::Handle; |
13 | use IO::File; |
bb6e4a92 |
14 | use URI (); |
11454d47 |
15 | use URI::Escape (); |
b2e1304d |
16 | |
5e458489 |
# Generate the read/write accessors that hold the per-instance state.
__PACKAGE__->mk_accessors(
    qw(environment request stdin stdout stderr)
);

# "enviroment" is an old misspelling of "environment". It is kept as an alias
# and listed for Pod::Coverage below instead of being documented.

=begin Pod::Coverage

enviroment

=end Pod::Coverage

=cut

*enviroment = \&environment;
5889d784 |
29 | |
bb6e4a92 |
# Lookup table keyed by the two-digit lower-case hex code of every character
# found in $URI::reserved.
my %reserved;
$reserved{ sprintf( '%02x', ord $_ ) } = 1 for split //, $URI::reserved;

# _uri_safe_unescape($string)
#
# Returns a copy of $string in which each %XX escape has been replaced by the
# byte it encodes, except for escapes whose code is in %reserved; those are
# left exactly as they were written.
sub _uri_safe_unescape {
    my ($s) = @_;

    $s =~ s{%([a-fA-F0-9]{2})}{
        my $hex = $1;
        $reserved{ lc $hex } ? "%$hex" : chr( hex $hex );
    }ge;

    return $s;
}
36 | |
b2e1304d |
# new( $request [, key => value, ... ] )
#
# Constructor. $request must be an HTTP::Request (or subclass) instance; the
# optional trailing key/value pairs are copied into the CGI environment and
# take precedence over the defaults computed here.
#
# The new object gets temporary files for stdin and stdout, and an
# environment hashref derived from the request URI, the Host header and the
# remaining request headers. Nothing global is touched until setup() is
# called.
#
# Croaks with a usage message when $request is not an HTTP::Request or the
# extra arguments are not an even-sized list.
sub new {
    my $class   = shift;
    my $request = shift;

    unless ( @_ % 2 == 0 && eval { $request->isa('HTTP::Request') } ) {
        croak(qq/usage: $class->new( \$request [, key => value] )/);
    }

    my $self = $class->SUPER::new( { restored => 0, setuped => 0 } );
    $self->request($request);
    $self->stdin( IO::File->new_tmpfile );
    $self->stdout( IO::File->new_tmpfile );

    # Work on a copy of the request URI and fill in whatever a relative or
    # partial URI is missing; a Host header overrides the URI's host:port.
    my $host = $request->header('Host');
    my $uri  = $request->uri->clone;
    $uri->scheme('http')    unless $uri->scheme;
    $uri->host('localhost') unless $uri->host;
    $uri->port(80)          unless $uri->port;
    $uri->host_port($host)  unless !$host || ( $host eq $uri->host_port );

    $uri = $uri->canonical;

    # Test the query for definedness rather than truth, so that a request
    # for "?0" yields QUERY_STRING "0" instead of the empty string.
    my $query = $uri->query;

    my $environment = {
        GATEWAY_INTERFACE => 'CGI/1.1',
        HTTP_HOST         => $uri->host_port,
        HTTPS             => ( $uri->scheme eq 'https' ) ? 'ON' : 'OFF',  # not in RFC 3875
        PATH_INFO         => $uri->path,
        QUERY_STRING      => ( defined $query ? $query : '' ),
        SCRIPT_NAME       => '/',
        SERVER_NAME       => $uri->host,
        SERVER_PORT       => $uri->port,
        SERVER_PROTOCOL   => $request->protocol || 'HTTP/1.1',
        SERVER_SOFTWARE   => "HTTP-Request-AsCGI/$VERSION",
        REMOTE_ADDR       => '127.0.0.1',
        REMOTE_HOST       => 'localhost',
        REMOTE_PORT       => int( rand(64000) + 1000 ),                   # not in RFC 3875
        REQUEST_URI       => $uri->path_query,                            # not in RFC 3875
        REQUEST_METHOD    => $request->method,
        @_    # caller-supplied pairs come last, so they win
    };

    # RFC 3875 says PATH_INFO is not URI-encoded. That's really
    # annoying for applications that you can't tell "%2F" vs "/", but
    # doing the partial decoding then makes it impossible to tell
    # "%252F" vs "%2F". Decoding everything is more compatible to what
    # web servers like Apache or lighttpd do, anyways.
    $environment->{PATH_INFO} = URI::Escape::uri_unescape($environment->{PATH_INFO});

    # Map request headers to CGI variables: "X-Foo" becomes HTTP_X_FOO, while
    # Content-Length and Content-Type lose the HTTP_ prefix. Keys that are
    # already present (defaults or caller overrides) are left alone.
    foreach my $field ( $request->headers->header_field_names ) {

        my $key = uc("HTTP_$field");
        $key =~ tr/-/_/;
        $key =~ s/^HTTP_// if $field =~ /^Content-(Length|Type)$/;

        unless ( exists $environment->{$key} ) {
            $environment->{$key} = $request->headers->header($field);
        }
    }

    # Unless SCRIPT_NAME is the default '/' and PATH_INFO is true, strip a
    # leading SCRIPT_NAME from PATH_INFO and collapse leading slashes to one.
    unless ( $environment->{SCRIPT_NAME} eq '/' && $environment->{PATH_INFO} ) {
        $environment->{PATH_INFO} =~ s/^\Q$environment->{SCRIPT_NAME}\E/\//;
        $environment->{PATH_INFO} =~ s/^\/+/\//;
    }

    $self->environment($environment);

    return $self;
}
105 | |
# setup()
#
# Switches the process into the emulated CGI context:
#   * saves a copy of %ENV and duplicates of STDIN (and of STDOUT / STDERR
#     when the corresponding accessor holds a handle) under $self->{restore};
#   * writes the request content to the stdin handle and rewinds it, when the
#     request reports a content length;
#   * re-opens STDIN / STDOUT / STDERR on the object's handles in binary mode;
#   * merges the object's environment hash into %ENV;
#   * resets CGI.pm's globals if CGI.pm has been loaded.
#
# Returns $self so calls can be chained. Croaks if any handle operation
# fails.
sub setup {
    my $self = shift;

    # Snapshot the current environment so restore() can put it back.
    $self->{restore}->{environment} = {%ENV};

    binmode( $self->stdin );

    if ( $self->request->content_length ) {

        $self->stdin->print( $self->request->content )
          or croak("Can't write request content to stdin handle: $!");

        # Push the buffered body out to the file before rewinding it.
        $self->stdin->flush
          or croak("Can't flush stdin handle: $!");

        $self->stdin->seek( 0, SEEK_SET )
          or croak("Can't seek stdin handle: $!");
    }

    # '<&' duplicates the descriptor (kept for restore); '<&=' re-opens the
    # global handle on the object's existing descriptor.
    open( $self->{restore}->{stdin}, '<&' . STDIN->fileno )
      or croak("Can't dup stdin: $!");

    open( STDIN, '<&=' . $self->stdin->fileno )
      or croak("Can't open stdin: $!");

    binmode(STDIN);

    if ( $self->stdout ) {

        open( $self->{restore}->{stdout}, '>&' . STDOUT->fileno )
          or croak("Can't dup stdout: $!");

        open( STDOUT, '>&=' . $self->stdout->fileno )
          or croak("Can't open stdout: $!");

        binmode( $self->stdout );
        binmode(STDOUT);
    }

    if ( $self->stderr ) {

        open( $self->{restore}->{stderr}, '>&' . STDERR->fileno )
          or croak("Can't dup stderr: $!");

        open( STDERR, '>&=' . $self->stderr->fileno )
          or croak("Can't open stderr: $!");

        binmode( $self->stderr );
        binmode(STDERR);
    }

    {
        no warnings 'uninitialized';

        # The parentheses are required: assignment binds tighter than the
        # comma operator, so without them %ENV is merely assigned to itself
        # and the CGI environment is discarded.
        %ENV = ( %ENV, %{ $self->environment } );
    }

    if ( $INC{'CGI.pm'} ) {
        CGI::initialize_globals();
    }

    $self->{setuped}++;

    return $self;
}
170 | |
780060e5 |
# response( [$callback] )
#
# Builds an HTTP::Response from whatever was written to the stdout handle.
# Returns undef when the object has no stdout handle.
#
# The header section is read up to the first blank line. With no output at
# all, a "500 Internal Server Error" status line is used; output that does
# not start with "HTTP" gets a "200 OK" status line prepended. A "Status"
# header, if present, overrides the response code and message.
#
# When $callback is true the response content is a code reference that hands
# back the body in chunks of up to 4096 bytes; otherwise the body is read
# into the response and Content-Length is filled in if it is missing.
#
# Croaks if the stdout handle cannot be rewound.
sub response {
    my ( $self, $callback ) = @_;

    my $out = $self->stdout;
    return undef unless $out;

    seek( $out, 0, SEEK_SET )
      or croak("Can't seek stdout handle: $!");

    # Accumulate lines until the blank line that ends the header section.
    my $head;
    while ( my $line = $out->getline ) {
        $head .= $line;
        last if $head =~ /\x0d?\x0a\x0d?\x0a$/;
    }

    $head = "HTTP/1.1 500 Internal Server Error\x0d\x0a"
      unless defined $head;

    $head = "HTTP/1.1 200 OK\x0d\x0a" . $head
      unless $head =~ /^HTTP/;

    my $response = HTTP::Response->parse($head);
    $response->date( time() ) unless $response->date;

    my $reason = $response->message;
    my $status = $response->header('Status');

    # Drop a trailing carriage return left on the parsed status message.
    if ( $reason && $reason =~ /^(.+)\x0d$/ ) {
        $response->message($1);
    }

    # A CGI "Status: NNN text" header overrides the status line.
    if ( $status && $status =~ /^(\d\d\d)\s?(.+)?$/ ) {
        my ( $code, $text ) = ( $1, $2 );

        $response->code($code);
        $response->message( $text || HTTP::Status::status_message($code) );
    }

    # Bytes left in the file after the headers, i.e. the size of the body.
    my $remaining = ( stat($out) )[7] - tell($out);

    if ( $response->code == 500 && !$remaining ) {
        $response->content( $response->error_as_HTML );
        $response->content_type('text/html');

        return $response;
    }

    if ($callback) {
        $response->content(
            sub {
                my $got = $out->read( my $chunk, 4096 );
                return $got ? $chunk : undef;
            }
        );

        return $response;
    }

    my $total = 0;
    while ( $out->read( my $chunk, 4096 ) ) {
        $total += length $chunk;
        $response->add_content($chunk);
    }

    $response->content_length($total)
      if $total && !$response->content_length;

    return $response;
}
251 | |
b2e1304d |
# restore()
#
# Undoes setup(): puts back the saved copy of %ENV, re-opens STDIN (and
# STDOUT / STDERR when they were redirected) on the descriptors saved by
# setup(), and rewinds the object's own handles so they can be read from the
# start.
#
# Returns $self. Croaks when setup() has not saved any state to restore, or
# when a handle cannot be flushed, re-opened or rewound.
sub restore {
    my $self = shift;

    # Fail early and clearly, before %ENV or any handle is touched, instead
    # of dying later on an undefined hash reference.
    my $saved = $self->{restore};
    unless ( $saved && $saved->{environment} && $saved->{stdin} ) {
        croak("Can't restore: setup() has not been called");
    }

    {
        no warnings 'uninitialized';
        %ENV = %{ $saved->{environment} };
    }

    open( STDIN, '<&' . fileno( $saved->{stdin} ) )
      or croak("Can't restore stdin: $!");

    sysseek( $self->stdin, 0, SEEK_SET )
      or croak("Can't seek stdin: $!");

    if ( $saved->{stdout} ) {

        # Flush first so buffered output lands in the capture file rather
        # than on the real STDOUT.
        STDOUT->flush
          or croak("Can't flush stdout: $!");

        open( STDOUT, '>&' . fileno( $saved->{stdout} ) )
          or croak("Can't restore stdout: $!");

        sysseek( $self->stdout, 0, SEEK_SET )
          or croak("Can't seek stdout: $!");
    }

    if ( $saved->{stderr} ) {

        STDERR->flush
          or croak("Can't flush stderr: $!");

        open( STDERR, '>&' . fileno( $saved->{stderr} ) )
          or croak("Can't restore stderr: $!");

        sysseek( $self->stderr, 0, SEEK_SET )
          or croak("Can't seek stderr: $!");
    }

    $self->{restored}++;

    return $self;
}
294 | |
# Destructor: when setup() has run and restore() has not, call restore() so
# the object does not go away leaving the environment and descriptors
# redirected.
sub DESTROY {
    my ($self) = @_;

    if ( $self->{setuped} && !$self->{restored} ) {
        $self->restore;
    }
}
299 | |
300 | 1; |
301 | |
302 | __END__ |
303 | |
b2e1304d |
304 | =head1 SYNOPSIS |
305 | |
bd7813ac |
306 | use CGI; |
307 | use HTTP::Request; |
308 | use HTTP::Request::AsCGI; |
15e50838 |
309 | |
bd7813ac |
310 | my $request = HTTP::Request->new( GET => 'http://www.host.com/' ); |
311 | my $stdout; |
15e50838 |
312 | |
bd7813ac |
313 | { |
314 | my $c = HTTP::Request::AsCGI->new($request)->setup; |
315 | my $q = CGI->new; |
15e50838 |
316 | |
bd7813ac |
317 | print $q->header, |
318 | $q->start_html('Hello World'), |
319 | $q->h1('Hello World'), |
320 | $q->end_html; |
15e50838 |
321 | |
bd7813ac |
322 | $stdout = $c->stdout; |
15e50838 |
323 | |
5e458489 |
324 | # environment and descriptors will automatically be restored |
2d51e42f |
325 | # when $c is destructed. |
bd7813ac |
326 | } |
15e50838 |
327 | |
bd7813ac |
328 | while ( my $line = $stdout->getline ) { |
329 | print $line; |
330 | } |
15e50838 |
331 | |
b2e1304d |
332 | =head1 DESCRIPTION |
333 | |
9a0e0b26 |
334 | Provides a convenient way of setting up a CGI environment from an HTTP::Request. |
2d51e42f |
335 | |
b2e1304d |
336 | =head1 METHODS |
337 | |
15e50838 |
338 | =over 4 |
14f243e8 |
339 | |
b332ee65 |
340 | =item new ( $request [, key => value ] ) |
14f243e8 |
341 | |
9a0e0b26 |
342 | Constructor. The first argument must be an instance of HTTP::Request, followed |
343 | by optional pairs of environment key and value. |
14f243e8 |
344 | |
5e458489 |
345 | =item environment |
14f243e8 |
346 | |
15e50838 |
347 | Returns a hashref containing the environment that will be used in setup. |
b332ee65 |
348 | Changing the hashref after setup has been called will have no effect. |
14f243e8 |
349 | |
b332ee65 |
350 | =item setup |
9c216915 |
351 | |
9a0e0b26 |
352 | Sets up the environment and descriptors. |
9c216915 |
353 | |
b332ee65 |
354 | =item restore |
9c216915 |
355 | |
5e458489 |
356 | Restores the environment and descriptors. Can only be called after setup. |
9c216915 |
357 | |
b332ee65 |
358 | =item request |
9c216915 |
359 | |
b332ee65 |
360 | Returns the request given to constructor. |
9c216915 |
361 | |
b332ee65 |
362 | =item response |
9c216915 |
363 | |
b332ee65 |
364 | Returns an HTTP::Response. Can only be called after restore. |
9c216915 |
365 | |
b332ee65 |
366 | =item stdin |
9c216915 |
367 | |
b332ee65 |
368 | Accessor for handle that will be used for STDIN, must be a real seekable |
369 | handle with a file descriptor. Defaults to a temporary IO::File instance. |
14f243e8 |
370 | |
b332ee65 |
371 | =item stdout |
14f243e8 |
372 | |
b332ee65 |
373 | Accessor for handle that will be used for STDOUT, must be a real seekable |
374 | handle with a file descriptor. Defaults to a temporary IO::File instance. |
9c216915 |
375 | |
b332ee65 |
376 | =item stderr |
14f243e8 |
377 | |
b332ee65 |
378 | Accessor for handle that will be used for STDERR, must be a real seekable |
379 | handle with a file descriptor. |
14f243e8 |
380 | |
381 | =back |
b2e1304d |
382 | |
74fbb9dd |
383 | =head1 SEE ALSO |
384 | |
385 | =over 4 |
386 | |
387 | =item examples directory in this distribution. |
388 | |
389 | =item L<WWW::Mechanize::CGI> |
390 | |
391 | =item L<Test::WWW::Mechanize::CGI> |
392 | |
393 | =back |
394 | |
2d51e42f |
395 | =head1 THANKS TO |
17b370b0 |
396 | |
397 | Thomas L. Shinnick for his valuable win32 testing. |
398 | |
b2e1304d |
399 | =cut |