only split identifiers when we have a separator
[dbsrgits/SQL-Abstract.git] / lib / SQL / Abstract / Converter.pm
CommitLineData
a82e41dc 1package SQL::Abstract::Converter;
2
3use Carp ();
4use List::Util ();
5use Scalar::Util ();
4caa4620 6use Data::Query::ExprHelpers;
a82e41dc 7use Moo;
8b9b83ae 8use namespace::clean;
a82e41dc 9
# Constructor options. Every attribute is read-only.

# When true, _ident_to_dq does not run identifiers through the injection
# guard.
has renderer_will_quote => (is => 'ro');

# When true, _sqlcase returns SQL keywords as given instead of upper-casing.
has lower_case => (is => 'ro');

# Fallback logic for _expr_to_dq_ARRAYREF when the caller passes none.
# The value is upper-cased on the way in.
has default_logic => (
  is      => 'ro',
  coerce  => sub { uc($_[0]) },
  default => sub { 'OR' },
);

# When true, bind values are expected as [ column_name => value ] pairs
# (see _bind_to_dq, _bindtype and _assert_bindval_matches_bindtype).
has bind_meta => (
  is      => 'ro',
  default => sub { 1 },
);

# Comparison operator used by _where_hashpair_to_dq when a column is paired
# with a plain value.
has cmp => (
  is      => 'ro',
  default => sub { '=' },
);

# Literal SQL substituted for conditions that are always true / always false
# (for instance a comparison against an empty list).
has sqltrue => (
  is      => 'ro',
  default => sub { '1=1' },
);
has sqlfalse => (
  is      => 'ro',
  default => sub { '0=1' },
);

# Arrayref of hashes; _where_hashpair_to_dq matches each entry's {regex}
# against the operator and, on a hit, calls its {handler}.
has special_ops => (
  is      => 'ro',
  default => sub { [] },
);

# XXX documented, but no tests currently fail when it is not used
has unary_ops => (
  is      => 'ro',
  default => sub { [] },
);

# Pattern rejected by _assert_pass_injection_guard: a semicolon anywhere, or
# a line that starts with "go" followed by whitespace (case-insensitive).
has injection_guard => (
  is      => 'ro',
  default => sub {
    qr/
      \;
        |
      ^ \s* go \s
    /xmi;
  },
);

# Separator on which _ident_to_dq splits identifiers; a false value disables
# splitting.
has identifier_sep => (
  is      => 'ro',
  default => sub { '.' },
);

# Not read by any of the conversion methods in this module.
has always_quote => (
  is      => 'ro',
  default => sub { 1 },
);

# Copied into {where_convert} by _where_to_dq; _maybe_convert_dq then wraps
# values and identifiers in a call to the named function.
has convert => (is => 'ro');

# When true, _mutation_rhs_to_dq treats an arrayref as a single bind value.
has array_datatypes => (is => 'ro');
56
# Wrap literal SQL in a DQ Literal node. $literal is either a plain SQL
# string or an arrayref [ $sql, @bind ]; the bind values go through
# _bind_to_dq.
sub _literal_to_dq {
  my ($self, $literal) = @_;
  my ($sql, @bind) = ref($literal) eq 'ARRAY' ? @$literal : ($literal);
  return Literal('SQL', $sql, [ $self->_bind_to_dq(@bind) ]);
}
63
# Turn a list of bind values into DQ value nodes. Returns nothing for an
# empty list. With bind_meta on, each bind must be a [ column => value ]
# pair; the pair is reversed so the value comes first and the column second
# when handed to perl_scalar_value.
sub _bind_to_dq {
  my ($self, @bind) = @_;
  return unless @bind;

  unless ($self->bind_meta) {
    return map perl_scalar_value($_), @bind;
  }

  $self->_assert_bindval_matches_bindtype(@bind);
  return map perl_scalar_value(reverse @$_), @bind;
}
74
# Build a DQ value node for $value, tagged with the column currently held in
# the package variable $Cur_Col_Meta, and apply the convert wrapper if one is
# active.
sub _value_to_dq {
  my $self = shift;
  my ($value) = @_;
  our $Cur_Col_Meta;
  return $self->_maybe_convert_dq(
    perl_scalar_value($value, $Cur_Col_Meta)
  );
}
79
# Build a DQ Identifier node from an identifier string. Unless the renderer
# is going to quote, the string must first pass the injection guard. The
# string is split on identifier_sep when a separator is configured, and is
# used whole otherwise.
sub _ident_to_dq {
  my ($self, $ident) = @_;

  if (!$self->renderer_will_quote) {
    $self->_assert_pass_injection_guard($ident);
  }

  my $sep = $self->identifier_sep;
  my @parts = $sep ? split(/\Q$sep/, $ident) : ($ident);

  return $self->_maybe_convert_dq(Identifier(@parts));
}
94
# If a convert function is active (set in {where_convert} by _where_to_dq),
# wrap $dq in an application of that function; otherwise return $dq as is.
sub _maybe_convert_dq {
  my ($self, $dq) = @_;

  my $convert = $self->{where_convert};
  return $dq unless $convert;

  return Operator(
    { 'SQL.Naive' => 'apply' },
    [ Identifier($self->_sqlcase($convert)), $dq ],
  );
}
107
# Build a DQ Operator node named $op over the remaining arguments. The
# operator name has to pass the injection guard first.
sub _op_to_dq {
  my $self = shift;
  my $op   = shift;
  my @args = @_;

  $self->_assert_pass_injection_guard($op);

  return Operator({ 'SQL.Naive' => $op }, \@args);
}
113
# Die if the string in $_[1] matches the object's {injection_guard} pattern.
#
#   $_[0]  the converter object (its {injection_guard} slot is read directly)
#   $_[1]  the identifier or operator string to check
#
# The message names the offending string and the object's class, and points
# the user at the two literal-SQL forms: \'...' (scalar ref) and \[ '...' ]
# (ref to an arrayref). The backslashes are doubled in the source because a
# single "\'" or "\[" inside a double-quoted string loses its backslash, which
# would make the hint show plain strings instead of references.
sub _assert_pass_injection_guard {
  if ($_[1] =~ $_[0]->{injection_guard}) {
    my $class = ref $_[0];
    die "Possible SQL injection attempt '$_[1]'. If this is indeed a part of the "
      . "desired SQL use literal SQL ( \\'...' or \\[ '...' ] ) or supply your own "
      . "{injection_guard} attribute to ${class}->new()"
  }
}
122
# Build a DQ Insert node.
#
#   $table    anything _table_to_dq accepts
#   $data     hashref of column => value (columns are emitted in sorted
#             order) or arrayref of positional values; anything else dies
#   $options  optional hashref; {returning} may be a single item or an
#             arrayref of items, each either an identifier string or a
#             reference handled by _expr_to_dq
sub _insert_to_dq {
  my ($self, $table, $data, $options) = @_;
  our $Cur_Col_Meta;

  my $data_type = ref($data);
  my (@names, @values);

  if ($data_type eq 'HASH') {
    @names = sort keys %$data;
    for my $column (@names) {
      # values are tagged with the column they belong to
      local $Cur_Col_Meta = $column;
      push @values, $self->_mutation_rhs_to_dq($data->{$column});
    }
  } elsif ($data_type eq 'ARRAY') {
    # positional values carry no column metadata
    local $Cur_Col_Meta;
    for my $item (@$data) {
      push @values, $self->_mutation_rhs_to_dq($item);
    }
  } else {
    die "Not handled yet";
  }

  my $returning;
  if (my $wanted = $options->{returning}) {
    my @wanted = ref($wanted) eq 'ARRAY' ? @$wanted : ($wanted);
    my @returning_dq;
    for my $item (@wanted) {
      push @returning_dq,
        ref($item) ? $self->_expr_to_dq($item) : $self->_ident_to_dq($item);
    }
    $returning = \@returning_dq;
  }

  my $names_dq = @names ? [ map $self->_ident_to_dq($_), @names ] : undef;

  return Insert(
    $names_dq,
    [ \@values ],
    $self->_table_to_dq($table),
    $returning,
  );
}
152
# Convert the right-hand side of an insert/update assignment.
#
# An arrayref is a single bind value when {array_datatypes} is set; otherwise
# it is wrapped in a reference so that _expr_to_dq sees it as literal SQL with
# binds. A hashref must have exactly one key of the form -op, or this dies.
# Everything else goes straight to _expr_to_dq.
sub _mutation_rhs_to_dq {
  my ($self, $v) = @_;

  my $kind = ref($v);

  if ($kind eq 'ARRAY') {
    return $self->_value_to_dq($v) if $self->{array_datatypes};
    my $copy = $v;
    return $self->_expr_to_dq(\$copy);
  }

  if ($kind eq 'HASH') {
    my @pairs = %$v;
    die 'Operator calls in update/insert must be in the form { -op => $arg }'
      if @pairs > 2 or $pairs[0] !~ /^\-(.+)/;
  }

  return $self->_expr_to_dq($v);
}
169
# Build a DQ Update node. $data must be a hashref of column => new value;
# the assignments are emitted in sorted column order. $where and $table are
# converted by _where_to_dq and _table_to_dq.
sub _update_to_dq {
  my ($self, $table, $data, $where) = @_;

  ref($data) eq 'HASH'
    or die "Unsupported data type specified to \$sql->update";

  our $Cur_Col_Meta;
  my @set;
  for my $column (sort keys %$data) {
    my $new_value = $data->{$column};
    # values are tagged with the column they are assigned to
    local $Cur_Col_Meta = $column;
    push @set, [
      $self->_ident_to_dq($column),
      $self->_mutation_rhs_to_dq($new_value),
    ];
  }

  return Update(
    \@set,
    $self->_where_to_dq($where),
    $self->_table_to_dq($table),
  );
}
190
# Build the source of a select: the table expression, wrapped in a Where
# node when the where clause converts to something true. Takes the same
# arguments as _select_to_dq; the field list (second argument) is ignored.
sub _source_to_dq {
  my $self = shift;
  my ($table, $where) = @_[0, 2];

  my $from_dq  = $self->_table_to_dq($table);
  my $where_dq = $self->_where_to_dq($where);

  $from_dq = Where($where_dq, $from_dq) if $where_dq;

  return $from_dq;
}
202
# Build a complete select: source (table + where), then ordering when an
# order argument is given, then the field list on top.
sub _select_to_dq {
  my ($self, @args) = @_;
  my ($fields, $order) = @args[1, 3];

  my $from_dq = $self->_source_to_dq(@args);

  $from_dq = $self->_order_by_to_dq($order, undef, undef, $from_dq)
    if $order;

  return $self->_select_select_to_dq($fields, $from_dq);
}
219
# Build a DQ Select node over $from_dq. A false field list means '*'.
sub _select_select_to_dq {
  my ($self, $fields, $from_dq) = @_;

  return Select(
    $self->_select_field_list_to_dq($fields || '*'),
    $from_dq,
  );
}
230
# Convert a field list (an arrayref of fields, or a single field) into an
# arrayref of DQ nodes, one per field.
sub _select_field_list_to_dq {
  my ($self, $fields) = @_;

  my @wanted = ref($fields) eq 'ARRAY' ? @$fields : ($fields);

  my @field_dq;
  push @field_dq, $self->_select_field_to_dq($_) for @wanted;

  return \@field_dq;
}
236
# Convert one select field. A plain string is an identifier; a reference to
# a hashref is taken to be a ready-made DQ node and returned unchanged; any
# other reference is dereferenced and treated as literal SQL.
sub _select_field_to_dq {
  my ($self, $field) = @_;

  my $type = ref($field);

  return $self->_ident_to_dq($field) unless $type;
  return $$field if $type eq 'REF' and ref($$field) eq 'HASH';
  return $self->_literal_to_dq($$field);
}
248
# Build a DQ Delete node from a table and a where clause.
sub _delete_to_dq {
  my $self = shift;
  my ($table, $where) = @_;

  return Delete(
    $self->_where_to_dq($where),
    $self->_table_to_dq($table),
  );
}
256
# Entry point for converting a where clause. Returns undef for an undefined
# clause, treats a plain string as literal SQL, and hands everything else to
# _expr_to_dq with the convert option switched on for the duration.
sub _where_to_dq {
  my ($self, $where, $logic) = @_;

  return undef if !defined($where);

  # a simple string is assumed to be a literal
  unless (ref($where)) {
    return $self->_literal_to_dq($where);
  }

  # the convert misfeature is only active inside WHERE clauses
  local $self->{where_convert} = $self->convert;

  return $self->_expr_to_dq($where, $logic);
}
270
# Dispatch an expression on its reference type:
#
#   ARRAY                 -> _expr_to_dq_ARRAYREF
#   HASH                  -> _expr_to_dq_HASHREF
#   SCALAR, REF to ARRAY  -> literal SQL
#   REF to HASH           -> returned unchanged (already a DQ node)
#   plain scalar, object  -> bind value
#
# Anything else dies.
sub _expr_to_dq {
  my ($self, $where, $logic) = @_;

  my $type = ref($where);

  return $self->_expr_to_dq_ARRAYREF($where, $logic) if $type eq 'ARRAY';
  return $self->_expr_to_dq_HASHREF($where, $logic)  if $type eq 'HASH';
  return $self->_literal_to_dq($$where)              if $type eq 'SCALAR';

  if ($type eq 'REF') {
    my $inner = ref($$where);
    return $self->_literal_to_dq($$where) if $inner eq 'ARRAY';
    return $$where                        if $inner eq 'HASH';
  }

  return $self->_value_to_dq($where)
    if !$type or Scalar::Util::blessed($where);

  die "Can't handle $where";
}
290
# Convert an arrayref of alternatives, joined with $logic (falling back to
# default_logic, then 'OR'). Dies on any logic other than AND / OR. An empty
# arrayref yields nothing. A non-reference element is a hash key and consumes
# the following element as its value.
sub _expr_to_dq_ARRAYREF {
  my ($self, $where, $logic) = @_;

  $logic = uc($logic || $self->default_logic || 'OR');
  die "unknown logic: $logic" unless $logic eq 'AND' or $logic eq 'OR';

  my @items = @$where;
  return unless @items;

  my $head = shift @items;

  # a lone element needs no joining
  return $self->_expr_to_dq($head) unless @items;

  my $head_dq = ref($head)
    ? $self->_expr_to_dq($head)
    : $self->_where_hashpair_to_dq($head => shift(@items));

  # an element that converted to nothing is skipped
  return $self->_expr_to_dq_ARRAYREF(\@items, $logic) unless $head_dq;

  return $self->_op_to_dq(
    $logic, $head_dq, $self->_expr_to_dq_ARRAYREF(\@items, $logic)
  );
}
317
# Convert a hashref of conditions. Pairs are converted in sorted key order
# and combined right-to-left with $logic, or 'AND' when no logic is given.
# With zero or one resulting condition, the first element (possibly undef) is
# returned directly.
sub _expr_to_dq_HASHREF {
  my ($self, $where, $logic) = @_;

  $logic = uc($logic) if $logic;

  my @dq;
  for my $key (sort keys %$where) {
    push @dq, $self->_where_hashpair_to_dq($key, $where->{$key}, $logic);
  }

  return $dq[0] unless @dq > 1;

  my $connective = $logic || 'AND';

  # fold from the right: a, b, c  ->  a OP (b OP c)
  my $combined = pop @dq;
  while (@dq) {
    $combined = $self->_op_to_dq($connective, pop(@dq), $combined);
  }

  return $combined;
}
337
# Thin alias: passes all arguments straight to _value_to_dq.
sub _where_to_dq_SCALAR {
  my ($self, @args) = @_;
  return $self->_value_to_dq(@args);
}
341
# Convert { -op => $v } for an operator name with no special handling into
# an application of the function $op to the converted argument(s).
sub _apply_to_dq {
  my ($self, $op, $v) = @_;

  my @operands = ref($v) eq 'ARRAY' ? @$v : ($v);
  my @args = map $self->_expr_to_dq($_), @operands;

  # Compatibility code. An SQLA expression such as
  #
  #   { -a => { -b => { -c => $x } } }
  #
  # would naively render as
  #
  #   A( B( C( x ) ) )
  #
  # but has to render as
  #
  #   A( B( C x ) )
  #
  # At the same time a plain 'A(x)' must not become 'A x'.
  #
  # So each argument is inspected: if it is itself an apply, with exactly
  # one argument of its own, and that argument is not an operator, it is
  # converted to the bareword form. The end result should be:
  #
  #   A( x )             -> A( x )
  #   A( B( x ) )        -> A( B x )
  #   A( B( C( x ) ) )   -> A( B( C x ) )
  #   A( B( x + y ) )    -> A( B( x + y ) )
  #   A( B( x, y ) )     -> A( B( x, y ) )
  #
  # If this turns out not to be quite right, please add additional tests
  # to either 01generate.t or 02where.t *and* update this comment.

  for my $inner (@args) {
    next unless is_Operator($inner);
    next unless $inner->{operator}{'SQL.Naive'} eq 'apply';

    # an apply node holds the function identifier followed by its operands
    my $inner_args = $inner->{args};
    next unless @$inner_args == 2;
    next if is_Operator($inner_args->[1]);

    # pull the function identifier out and use its name as the operator
    my $func_ident = shift @$inner_args;
    $inner->{operator}{'SQL.Naive'} = $func_ident->{elements}->[0];
  }

  $self->_assert_pass_injection_guard($op);

  return $self->_op_to_dq(
    apply => $self->_ident_to_dq($op), @args
  );
}
391
# Convert one `$k => $v` pair of a where-hash into a DQ node.
#
#   $k      either a "-op" key (-and, -or, -nest, -not, -bool, -not_bool,
#           -ident, -value; any other -name becomes a function application
#           via _apply_to_dq) or a column name
#   $v      the right-hand side: plain value, arrayref of alternatives,
#           hashref of { op => rhs }, or literal SQL given as a scalar ref
#           or a ref to an arrayref
#   $logic  optional AND/OR handed down for joining array alternatives
#
# Dies on the removed -and_N / -or_N / -nest_N modifiers, and on an undef
# right-hand side for operators other than =, LIKE and !=.
sub _where_hashpair_to_dq {
  my ($self, $k, $v, $logic) = @_;

  if ($k =~ /^-(.*)/s) {
    # "-op" keys: logic modifiers, unary operators and function calls
    my $op = uc($1);
    if ($op eq 'AND' or $op eq 'OR') {
      return $self->_expr_to_dq($v, $op);
    } elsif ($op eq 'NEST') {
      return $self->_expr_to_dq($v);
    } elsif ($op eq 'NOT') {
      return $self->_op_to_dq(NOT => $self->_expr_to_dq($v));
    } elsif ($op eq 'BOOL') {
      return ref($v) ? $self->_expr_to_dq($v) : $self->_ident_to_dq($v);
    } elsif ($op eq 'NOT_BOOL') {
      return $self->_op_to_dq(
        NOT => ref($v) ? $self->_expr_to_dq($v) : $self->_ident_to_dq($v)
      );
    } elsif ($op eq 'IDENT') {
      return $self->_ident_to_dq($v);
    } elsif ($op eq 'VALUE') {
      return $self->_value_to_dq($v);
    } elsif ($op =~ /^(?:AND|OR|NEST)_?\d+/) {
      die "Use of [and|or|nest]_N modifiers is no longer supported";
    } else {
      return $self->_apply_to_dq($op, $v);
    }
  } else {
    # column keys: every value converted below is tagged with this column
    local our $Cur_Col_Meta = $k;
    if (ref($v) eq 'ARRAY') {
      if (!@$v) {
        # no alternatives at all can never match
        return $self->_literal_to_dq($self->{sqlfalse});
      } elsif (defined($v->[0]) && $v->[0] =~ /^-(and|or)$/i) {
        # A leading '-and' / '-or' element selects the logic for the rest.
        # The match is anchored so that an ordinary value which merely
        # contains "-and" or "-or" (e.g. 'rock-and-roll') stays a value.
        return $self->_expr_to_dq_ARRAYREF([
          map +{ $k => $_ }, @{$v}[1..$#$v]
        ], uc($1));
      }
      return $self->_expr_to_dq_ARRAYREF([
        map +{ $k => $_ }, @$v
      ], $logic);
    } elsif (ref($v) eq 'SCALAR' or (ref($v) eq 'REF' and ref($$v) eq 'ARRAY')) {
      # literal SQL on the right: column followed by the literal
      return Literal('SQL', [ $self->_ident_to_dq($k), $self->_literal_to_dq($$v) ]);
    }
    # Work out the operator and its right-hand side. Note that the `return`
    # statements inside this do-block leave the whole sub.
    my ($op, $rhs) = do {
      if (ref($v) eq 'HASH') {
        if (keys %$v > 1) {
          # several operators on one column: one condition per operator
          return $self->_expr_to_dq_ARRAYREF([
            map +{ $k => { $_ => $v->{$_} } }, sort keys %$v
          ], $logic||'AND');
        }
        my ($op, $value) = %$v;
        # normalise: drop a leading dash, underscores become spaces
        s/^-//, s/_/ /g for $op;
        if ($op =~ /^(and|or)$/i) {
          return $self->_expr_to_dq({ $k => $value }, $op);
        } elsif (
          my $special_op = List::Util::first {$op =~ $_->{regex}}
                             @{$self->{special_ops}}
        ) {
          # user-supplied handler returns literal SQL plus binds
          return $self->_literal_to_dq(
            [ $special_op->{handler}->($k, $op, $value) ]
          );
        } elsif ($op =~ /^(?:AND|OR|NEST)_?\d+$/i) {
          die "Use of [and|or|nest]_N modifiers is no longer supported";
        }
        (uc($op), $value);
      } else {
        # plain value: compare with the default operator
        ($self->{cmp}, $v);
      }
    };
    if ($op eq 'BETWEEN' or $op eq 'IN' or $op eq 'NOT IN' or $op eq 'NOT BETWEEN') {
      if (ref($rhs) ne 'ARRAY') {
        if ($op =~ /IN$/) {
          # have to add parens if none present because -in => \"SELECT ..."
          # got documented. mst hates everything.
          if (ref($rhs) eq 'SCALAR') {
            my $x = $$rhs;
            1 while ($x =~ s/\A\s*\((.*)\)\s*\Z/$1/s);
            $rhs = \$x;
          } else {
            my ($x, @rest) = @{$$rhs};
            1 while ($x =~ s/\A\s*\((.*)\)\s*\Z/$1/s);
            $rhs = \[ $x, @rest ];
          }
        }
        return $self->_op_to_dq(
          $op, $self->_ident_to_dq($k), $self->_literal_to_dq($$rhs)
        );
      }
      # an empty list on the right can never match
      return $self->_literal_to_dq($self->{sqlfalse}) unless @$rhs;
      return $self->_op_to_dq(
        $op, $self->_ident_to_dq($k), map $self->_expr_to_dq($_), @$rhs
      )
    } elsif ($op =~ s/^NOT (?!LIKE)//) {
      # "NOT <op>" (other than NOT LIKE) becomes -not around the bare operator
      return $self->_where_hashpair_to_dq(-not => { $k => { $op => $rhs } });
    } elsif ($op eq 'IDENT') {
      return $self->_op_to_dq(
        $self->{cmp}, $self->_ident_to_dq($k), $self->_ident_to_dq($rhs)
      );
    } elsif ($op eq 'VALUE') {
      return $self->_op_to_dq(
        $self->{cmp}, $self->_ident_to_dq($k), $self->_value_to_dq($rhs)
      );
    } elsif (!defined($rhs)) {
      # undef on the right means a NULL test
      my $null_op = do {
        if ($op eq '=' or $op eq 'LIKE') {
          'IS NULL'
        } elsif ($op eq '!=') {
          'IS NOT NULL'
        } else {
          die "Can't do undef -> NULL transform for operator ${op}";
        }
      };
      return $self->_op_to_dq($null_op, $self->_ident_to_dq($k));
    }
    if (ref($rhs) eq 'ARRAY') {
      if (!@$rhs) {
        # "!= <nothing>" is always true, anything else always false
        return $self->_literal_to_dq(
          $op eq '!=' ? $self->{sqltrue} : $self->{sqlfalse}
        );
      } elsif (defined($rhs->[0]) and $rhs->[0] =~ /^-(and|or)$/i) {
        return $self->_expr_to_dq_ARRAYREF([
          map +{ $k => { $op => $_ } }, @{$rhs}[1..$#$rhs]
        ], uc($1));
      } elsif ($op =~ /^-(?:AND|OR|NEST)_?\d+/) {
        die "Use of [and|or|nest]_N modifiers is no longer supported";
      }
      return $self->_expr_to_dq_ARRAYREF([
        map +{ $k => { $op => $_ } }, @$rhs
      ]);
    }
    return $self->_op_to_dq(
      $op, $self->_ident_to_dq($k), $self->_expr_to_dq($rhs)
    );
  }
}
526
# Convert an order-by specification into DQ Order node(s).
#
#   $arg    plain string (identifier), arrayref of further specifications,
#           scalar ref or ref to arrayref (literal SQL), or a hashref with
#           exactly one -asc / -desc key and an optional -nulls key
#   $dir    optional direction string; a match on /desc/i means reversed
#   $nulls  optional nulls placement; a match on /first/i maps to 1, else -1
#   $from   optional DQ node the ordering applies to
#
# Returns nothing for a false $arg, an empty arrayref or an empty hashref.
sub _order_by_to_dq {
  my ($self, $arg, $dir, $nulls, $from) = @_;

  return unless $arg;

  my $reverse     = defined($dir)   ? !!($dir =~ /desc/i)           : undef;
  my $nulls_order = defined($nulls) ? ($nulls =~ /first/i ? 1 : -1) : undef;

  my $dq = Order(undef, $reverse, $nulls_order, ($from || undef));

  my $type = ref($arg);

  if ($type eq 'ARRAY') {
    return unless @$arg;

    # Each member becomes the {from} of the innermost node produced so far.
    # $Order_Inner hands the innermost node of a nested list back up to the
    # enclosing call; it is only reset at the outermost level.
    our ($Order_Inner, $Order_Recursing);
    local $Order_Inner unless $Order_Recursing;
    local $Order_Recursing = 1;

    my ($outermost, $innermost);
    for my $member (@$arg) {
      local $Order_Inner;
      my $member_dq = $self->_order_by_to_dq($member, $dir, $nulls, $from);
      $outermost ||= $member_dq;
      $innermost->{from} = $member_dq if $innermost;
      $innermost = $Order_Inner || $member_dq;
    }
    $Order_Inner = $innermost;
    return $outermost;
  }

  if ($type eq 'HASH') {
    return () unless %$arg;

    my ($direction, $target);
    for my $key (keys %$arg) {
      if ($key =~ /^-(desc|asc)/i) {
        die "hash passed to _order_by_to_dq must have exactly one of -desc or -asc"
          if defined $direction;
        $direction = $1;
        $target    = $arg->{$key};
      } elsif ($key =~ /^-nulls$/i) {
        $nulls = $arg->{$key};
        die "invalid value for -nulls" unless $nulls =~ /^(?:first|last)$/i;
      } else {
        die "invalid key in hash passed to _order_by_to_dq";
      }
    }

    die "hash passed to _order_by_to_dq must have exactly one of -desc or -asc"
      unless defined $direction;

    return $self->_order_by_to_dq($target, $direction, $nulls, $from);
  }

  if (!$type) {
    $dq->{by} = $self->_ident_to_dq($arg);
  } elsif ($type eq 'REF' and ref($$arg) eq 'ARRAY') {
    $dq->{by} = $self->_literal_to_dq($$arg);
  } elsif ($type eq 'SCALAR') {
    # A literal that is just a word, optionally followed by asc/desc, is
    # turned into a real identifier plus direction. Anything that does not
    # match that shape is left untouched as literal SQL. This regex exists
    # only here.
    if ($$arg =~ /^(\w+)(?:\s+(desc|asc))?$/i) {
      my ($ident, $suffix) = ($1, $2);
      $dq->{by} = $self->_ident_to_dq($ident);
      $dq->{reverse} = 1 if $suffix and lc($suffix) eq 'desc';
    } else {
      $dq->{by} = $self->_literal_to_dq($$arg);
    }
  } else {
    die "Can't handle $arg in _order_by_to_dq";
  }

  return $dq;
}
602
# Convert a FROM specification into a DQ node.
#
#   arrayref             each element is converted recursively and the
#                        results are chained with Join, left to right;
#                        dies on an empty list
#   scalar ref / REF     literal SQL
#   anything else        identifier
sub _table_to_dq {
  my ($self, $from) = @_;
  if (ref($from) eq 'ARRAY') {
    die "Empty FROM list" unless my @f = @$from;
    my $dq = $self->_table_to_dq(shift @f);
    # Test for definedness rather than truth, so a table whose name is a
    # false string (such as '0') does not silently cut the list short.
    while (defined(my $x = shift @f)) {
      $dq = Join(
        $dq,
        $self->_table_to_dq($x),
      );
    }
    return $dq;
  } elsif (ref($from) eq 'SCALAR' or (ref($from) eq 'REF')) {
    return $self->_literal_to_dq($$from);
  } else {
    return $self->_ident_to_dq($from);
  }
}
621
# Pair bind values with their column when bind_meta is on.
#
# Called as $self->_bindtype($col, @vals). With bind_meta true, each value is
# returned as [ $col, $value ]; otherwise the values are returned unchanged.
#
# LDNOTE: an earlier implementation returned [ $col, @vals ] as one arrayref,
# which did not make sense for more than one value.
sub _bindtype (@) {
  my ($self, $col, @vals) = @_;

  return map +[ $col, $_ ], @vals if $self->bind_meta;

  # returned as a slice so scalar context still yields the last value
  return @vals[0 .. $#vals];
}
636
# With bind_meta on, die unless every element of the given bind list is a
# two-element arrayref, i.e. [ column_name => bind_value ]. Does nothing when
# bind_meta is off.
sub _assert_bindval_matches_bindtype {
  my ($self, @bind) = @_;

  return unless $self->bind_meta;

  for my $pair (@bind) {
    next if defined($pair) && ref($pair) eq 'ARRAY' && @$pair == 2;
    die "bindtype 'columns' selected, you need to pass: [column_name => bind_value]"
  }

  return;
}
650
# Return the SQL fragment in the requested case: unchanged when lower_case
# is set, upper-cased otherwise.
sub _sqlcase {
  my ($self, $sql) = @_;
  return $sql if $self->lower_case;
  return uc($sql);
}
655
6561;