reimplement PATH_INFO unescaping
[catagits/HTTP-Request-AsCGI.git] / lib / HTTP / Request / AsCGI.pm
CommitLineData
b2e1304d 1package HTTP::Request::AsCGI;
f1dd0792 2# ABSTRACT: Set up a CGI environment from an HTTP::Request
b2e1304d 3use strict;
4use warnings;
090cc060 5use bytes;
b2e1304d 6use base 'Class::Accessor::Fast';
7
b332ee65 8use Carp;
9use HTTP::Response;
10use IO::Handle;
11use IO::File;
bb6e4a92 12use URI ();
11454d47 13use URI::Escape ();
b2e1304d 14
# Generate simple read/write accessors for the object's public fields.
__PACKAGE__->mk_accessors( qw(environment request stdin stdout stderr) );

# Keep the historically misspelled accessor name working as an alias of
# the correctly spelled one; it is hidden from POD coverage checks.

=begin Pod::Coverage

 enviroment

=end Pod::Coverage

=cut

*enviroment = \&environment;
5889d784 27
# Lowercase two-digit hex codes of every character listed in
# $URI::reserved; escapes of these characters are left untouched.
my %keep_escaped;
$keep_escaped{ sprintf( '%02x', ord($_) ) } = 1 for split //, $URI::reserved;

# Decode %XX escapes in a string, except those that encode a URI reserved
# character, which are copied through exactly as written.
# Takes the escaped string and returns the partially decoded copy.
sub _uri_safe_unescape {
    my ($escaped) = @_;

    $escaped =~ s{%([a-fA-F0-9]{2})}{
        $keep_escaped{ lc $1 } ? "%$1" : chr( hex $1 )
    }ge;

    return $escaped;
}
34
# Constructor.
#
#   my $c = HTTP::Request::AsCGI->new( $request, KEY => 'value', ... );
#
# $request must be an HTTP::Request. Any further arguments are key/value
# pairs that are merged into the generated CGI environment and take
# precedence over the defaults computed here. Croaks with a usage message
# when $request is not an HTTP::Request or the extra arguments are not
# pairs.
#
# Returns the new object, with temporary files installed as the stdin and
# stdout handles. %ENV and the standard handles are not modified here.
sub new {
    my $class   = shift;
    my $request = shift;

    unless ( @_ % 2 == 0 && eval { $request->isa('HTTP::Request') } ) {
        croak(qq/usage: $class->new( \$request [, key => value] )/);
    }

    my $self = $class->SUPER::new( { restored => 0, setuped => 0 } );
    $self->request($request);
    $self->stdin( IO::File->new_tmpfile );
    $self->stdout( IO::File->new_tmpfile );

    # Work on a copy of the request URI, filling in whatever is missing so
    # that scheme, host and port are always available below. A Host header
    # that disagrees with the URI wins.
    my $host = $request->header('Host');
    my $uri  = $request->uri->clone;
    $uri->scheme('http')    unless $uri->scheme;
    $uri->host('localhost') unless $uri->host;
    $uri->port(80)          unless $uri->port;
    $uri->host_port($host)  unless !$host || ( $host eq $uri->host_port );

    $uri = $uri->canonical;

    # Test definedness rather than truth so that a query string of "0"
    # is passed through instead of being replaced by the empty string.
    my $query = $uri->query;
    $query = '' unless defined $query;

    # Declare the package version variable here so the reference below
    # compiles under strict even without a file-level declaration, and
    # avoid an "uninitialized" warning when no version has been assigned.
    our $VERSION;
    my $version = defined $VERSION ? $VERSION : '';

    my $environment = {
        GATEWAY_INTERFACE => 'CGI/1.1',
        HTTP_HOST         => $uri->host_port,
        HTTPS             => ( $uri->scheme eq 'https' ) ? 'ON' : 'OFF',  # not in RFC 3875
        PATH_INFO         => _uri_safe_unescape( $uri->path ),
        QUERY_STRING      => $query,
        SCRIPT_NAME       => '/',
        SERVER_NAME       => $uri->host,
        SERVER_PORT       => $uri->port,
        SERVER_PROTOCOL   => $request->protocol || 'HTTP/1.1',
        SERVER_SOFTWARE   => "HTTP-Request-AsCGI/$version",
        REMOTE_ADDR       => '127.0.0.1',
        REMOTE_HOST       => 'localhost',
        REMOTE_PORT       => int( rand(64000) + 1000 ),                   # not in RFC 3875
        REQUEST_URI       => $uri->path_query,                            # not in RFC 3875
        REQUEST_METHOD    => $request->method,
        @_    # caller-supplied pairs come last so they override the defaults
    };

    # Export each request header as HTTP_<NAME>, except Content-Length and
    # Content-Type, which lose the HTTP_ prefix. Keys that are already
    # present (defaults or caller overrides) are never replaced.
    foreach my $field ( $request->headers->header_field_names ) {

        my $key = uc("HTTP_$field");
        $key =~ tr/-/_/;
        $key =~ s/^HTTP_// if $field =~ /^Content-(Length|Type)$/;

        unless ( exists $environment->{$key} ) {
            $environment->{$key} = $request->headers->header($field);
        }
    }

    # Unless SCRIPT_NAME is still the default '/' and PATH_INFO is
    # non-empty, strip the script name from the front of PATH_INFO and
    # collapse any run of leading slashes into a single one.
    unless ( $environment->{SCRIPT_NAME} eq '/' && $environment->{PATH_INFO} ) {
        $environment->{PATH_INFO} =~ s/^\Q$environment->{SCRIPT_NAME}\E/\//;
        $environment->{PATH_INFO} =~ s/^\/+/\//;
    }

    $self->environment($environment);

    return $self;
}
96
# Install the CGI environment: save the current %ENV and standard handles,
# feed the request body to STDIN, point STDIN/STDOUT/STDERR at the
# object's handles and replace %ENV with the prepared environment.
# Croaks if any handle operation fails. Returns the object itself.
sub setup {
    my $self = shift;

    # Everything needed by restore() is kept under the 'restore' key.
    my $saved = $self->{restore} ||= {};
    $saved->{environment} = {%ENV};

    my $in = $self->stdin;
    binmode($in);

    # Copy the request body into the stdin handle and rewind it. This only
    # happens when the request reports a content length.
    if ( $self->request->content_length ) {

        croak("Can't write request content to stdin handle: $!")
          unless $in->print( $self->request->content );

        croak("Can't seek stdin handle: $!")
          unless $in->seek( 0, SEEK_SET );

        croak("Can't flush stdin handle: $!")
          unless $in->flush;
    }

    # Keep a duplicate of the real STDIN, then alias STDIN to our handle.
    croak("Can't dup stdin: $!")
      unless open( $saved->{stdin}, '<&' . STDIN->fileno );

    croak("Can't open stdin: $!")
      unless open( STDIN, '<&=' . $in->fileno );

    binmode(STDIN);

    # STDOUT and STDERR are only redirected when a handle was supplied.
    my $out = $self->stdout;
    if ($out) {

        croak("Can't dup stdout: $!")
          unless open( $saved->{stdout}, '>&' . STDOUT->fileno );

        croak("Can't open stdout: $!")
          unless open( STDOUT, '>&=' . $out->fileno );

        binmode($out);
        binmode(STDOUT);
    }

    my $err = $self->stderr;
    if ($err) {

        croak("Can't dup stderr: $!")
          unless open( $saved->{stderr}, '>&' . STDERR->fileno );

        croak("Can't open stderr: $!")
          unless open( STDERR, '>&=' . $err->fileno );

        binmode($err);
        binmode(STDERR);
    }

    {
        # Undefined environment values must not produce warnings.
        no warnings 'uninitialized';
        %ENV = %{ $self->environment };
    }

    # Reset CGI.pm's global state if that module has been loaded.
    CGI::initialize_globals() if $INC{'CGI.pm'};

    $self->{setuped}++;

    return $self;
}
161
# Build an HTTP::Response from what was written to the stdout handle.
#
# Returns undef when the object has no stdout handle. When $callback is
# true the response content is a code reference that yields the body in
# chunks of up to 4096 bytes; otherwise the whole body is read into the
# response and Content-Length is filled in if it is missing.
# Croaks if the stdout handle cannot be rewound.
sub response {
    my ( $self, $callback ) = @_;

    my $out = $self->stdout;
    return undef unless $out;

    seek( $out, 0, SEEK_SET )
      or croak("Can't seek stdout handle: $!");

    # Collect the header section: every line up to and including the
    # first empty line.
    my $head;
    while ( my $line = $out->getline ) {
        $head .= $line;
        last if $head =~ /\x0d?\x0a\x0d?\x0a$/;
    }

    # No output at all is reported as a server error; output that does not
    # start with a status line gets a default one prepended.
    $head = "HTTP/1.1 500 Internal Server Error\x0d\x0a"
      unless defined $head;

    $head = "HTTP/1.1 200 OK\x0d\x0a" . $head
      unless $head =~ /^HTTP/;

    my $response = HTTP::Response->parse($head);
    $response->date( time() ) unless $response->date;

    my $message = $response->message;
    my $status  = $response->header('Status');

    # Drop a trailing carriage return left on the parsed status message.
    if ( $message && $message =~ /^(.+)\x0d$/ ) {
        $response->message($1);
    }

    # A "Status" header overrides the code and message of the status line.
    if ( $status && $status =~ /^(\d\d\d)\s?(.+)?$/ ) {

        my ( $code, $reason ) = ( $1, $2 );
        $reason ||= HTTP::Status::status_message($code);

        $response->code($code);
        $response->message($reason);
    }

    # Number of bytes left in the handle after the header section.
    my $remaining = ( stat($out) )[7] - tell($out);

    if ( $response->code == 500 && !$remaining ) {

        $response->content( $response->error_as_HTML );
        $response->content_type('text/html');

        return $response;
    }

    if ($callback) {

        $response->content( sub {
            my $got = $out->read( my $chunk, 4096 );
            return $got ? $chunk : undef;
        });

        return $response;
    }

    my $bytes_read = 0;

    while ( $out->read( my $chunk, 4096 ) ) {
        $bytes_read += length($chunk);
        $response->add_content($chunk);
    }

    $response->content_length($bytes_read)
      if $bytes_read && !$response->content_length;

    return $response;
}
242
# Undo setup(): put back the saved %ENV, reconnect STDIN (and STDOUT and
# STDERR when they were redirected) to the duplicates saved by setup(),
# and rewind the object's own handles.
# Croaks if any handle operation fails. Returns the object itself.
sub restore {
    my $self = shift;

    {
        # Undefined environment values must not produce warnings.
        no warnings 'uninitialized';
        %ENV = %{ $self->{restore}{environment} };
    }

    croak("Can't restore stdin: $!")
      unless open( STDIN, '<&' . fileno( $self->{restore}{stdin} ) );

    croak("Can't seek stdin: $!")
      unless sysseek( $self->stdin, 0, SEEK_SET );

    if ( $self->{restore}{stdout} ) {

        # Push out anything still buffered before switching back.
        croak("Can't flush stdout: $!")
          unless STDOUT->flush;

        croak("Can't restore stdout: $!")
          unless open( STDOUT, '>&' . fileno( $self->{restore}{stdout} ) );

        croak("Can't seek stdout: $!")
          unless sysseek( $self->stdout, 0, SEEK_SET );
    }

    if ( $self->{restore}{stderr} ) {

        # Push out anything still buffered before switching back.
        croak("Can't flush stderr: $!")
          unless STDERR->flush;

        croak("Can't restore stderr: $!")
          unless open( STDERR, '>&' . fileno( $self->{restore}{stderr} ) );

        croak("Can't seek stderr: $!")
          unless sysseek( $self->stderr, 0, SEEK_SET );
    }

    $self->{restored}++;

    return $self;
}
285
# Destructor: restore the environment and descriptors if the object is
# destroyed while a setup() is still in effect.
#
# 'setuped' and 'restored' are counters, so compare them instead of
# testing them as booleans: after setup, restore and a second setup the
# old boolean test saw a true 'restored' and skipped the restore.
sub DESTROY {
    my $self = shift;

    my $setups   = $self->{setuped}  || 0;
    my $restores = $self->{restored} || 0;

    $self->restore if $setups > $restores;
}
290
2911;
292
293__END__
294
b2e1304d 295=head1 SYNOPSIS
296
bd7813ac 297 use CGI;
298 use HTTP::Request;
299 use HTTP::Request::AsCGI;
b332ee65 300
bd7813ac 301 my $request = HTTP::Request->new( GET => 'http://www.host.com/' );
302 my $stdout;
b332ee65 303
bd7813ac 304 {
305 my $c = HTTP::Request::AsCGI->new($request)->setup;
306 my $q = CGI->new;
b332ee65 307
bd7813ac 308 print $q->header,
309 $q->start_html('Hello World'),
310 $q->h1('Hello World'),
311 $q->end_html;
b332ee65 312
bd7813ac 313 $stdout = $c->stdout;
b332ee65 314
5e458489 315 # environment and descriptors will automatically be restored
2d51e42f 316 # when $c is destructed.
bd7813ac 317 }
b332ee65 318
bd7813ac 319 while ( my $line = $stdout->getline ) {
320 print $line;
321 }
b332ee65 322
b2e1304d 323=head1 DESCRIPTION
324
9a0e0b26 325Provides a convenient way of setting up a CGI environment from an HTTP::Request.
2d51e42f 326
b2e1304d 327=head1 METHODS
328
b332ee65 329=over 4
14f243e8 330
b332ee65 331=item new ( $request [, key => value ] )
14f243e8 332
9a0e0b26 333Constructor. The first argument must be an instance of HTTP::Request, followed
334by optional pairs of environment key and value.
14f243e8 335
5e458489 336=item environment
14f243e8 337
b332ee65 338Returns a hashref containing the environment that will be used in setup.
339Changing the hashref after setup has been called will have no effect.
14f243e8 340
b332ee65 341=item setup
9c216915 342
9a0e0b26 343Sets up the environment and descriptors.
9c216915 344
b332ee65 345=item restore
9c216915 346
5e458489 347Restores the environment and descriptors. Can only be called after setup.
9c216915 348
b332ee65 349=item request
9c216915 350
b332ee65 351Returns the request given to constructor.
9c216915 352
b332ee65 353=item response
9c216915 354
b332ee65 355Returns an HTTP::Response. Can only be called after restore.
9c216915 356
b332ee65 357=item stdin
9c216915 358
b332ee65 359Accessor for handle that will be used for STDIN, must be a real seekable
360handle with a file descriptor. Defaults to a temporary IO::File instance.
14f243e8 361
b332ee65 362=item stdout
14f243e8 363
b332ee65 364Accessor for handle that will be used for STDOUT, must be a real seekable
365handle with a file descriptor. Defaults to a temporary IO::File instance.
9c216915 366
b332ee65 367=item stderr
14f243e8 368
b332ee65 369Accessor for handle that will be used for STDERR, must be a real seekable
370handle with a file descriptor.
14f243e8 371
372=back
b2e1304d 373
74fbb9dd 374=head1 SEE ALSO
375
376=over 4
377
378=item examples directory in this distribution.
379
380=item L<WWW::Mechanize::CGI>
381
382=item L<Test::WWW::Mechanize::CGI>
383
384=back
385
2d51e42f 386=head1 THANKS TO
17b370b0 387
388Thomas L. Shinnick for his valuable win32 testing.
389
b2e1304d 390=cut