fixed _refkind for \$object, \\$object. Added tests for _refkind
[dbsrgits/SQL-Abstract.git] / lib / SQL / Abstract.pm
CommitLineData
96449e8e 1package SQL::Abstract; # see doc at end of file
2
3# LDNOTE : this code is heavy refactoring from original SQLA.
4# Several design decisions will need discussion during
5# the test / diffusion / acceptance phase; those are marked with flag
6# 'LDNOTE' (note by laurent.dami AT free.fr)
7
8use Carp;
9use strict;
10use warnings;
fffe6900 11use List::Util qw/first/;
12use Scalar::Util qw/blessed/;
96449e8e 13
14#======================================================================
15# GLOBALS
16#======================================================================
17
18our $VERSION = '1.49_01';
7479e27e 19$VERSION = eval $VERSION; # numify for warning-free dev releases
20
96449e8e 21
22our $AUTOLOAD;
23
24# special operators (-in, -between). May be extended/overridden by user.
25# See section WHERE: BUILTIN SPECIAL OPERATORS below for implementation
26my @BUILTIN_SPECIAL_OPS = (
27 {regex => qr/^(not )?between$/i, handler => \&_where_field_BETWEEN},
28 {regex => qr/^(not )?in$/i, handler => \&_where_field_IN},
29);
30
31#======================================================================
32# DEBUGGING AND ERROR REPORTING
33#======================================================================
34
35sub _debug {
36 return unless $_[0]->{debug}; shift; # a little faster
37 my $func = (caller(1))[3];
38 warn "[$func] ", @_, "\n";
39}
40
41sub belch (@) {
42 my($func) = (caller(1))[3];
43 carp "[$func] Warning: ", @_;
44}
45
46sub puke (@) {
47 my($func) = (caller(1))[3];
48 croak "[$func] Fatal: ", @_;
49}
50
51
52#======================================================================
53# NEW
54#======================================================================
55
56sub new {
57 my $self = shift;
58 my $class = ref($self) || $self;
59 my %opt = (ref $_[0] eq 'HASH') ? %{$_[0]} : @_;
60
61 # choose our case by keeping an option around
62 delete $opt{case} if $opt{case} && $opt{case} ne 'lower';
63
64 # default logic for interpreting arrayrefs
65 $opt{logic} = uc $opt{logic} || 'OR';
66
67 # how to return bind vars
68 # LDNOTE: changed nwiger code : why this 'delete' ??
69 # $opt{bindtype} ||= delete($opt{bind_type}) || 'normal';
70 $opt{bindtype} ||= 'normal';
71
72 # default comparison is "=", but can be overridden
73 $opt{cmp} ||= '=';
74
75 # try to recognize which are the 'equality' and 'unequality' ops
76 # (temporary quickfix, should go through a more seasoned API)
77 $opt{equality_op} = qr/^(\Q$opt{cmp}\E|is|(is\s+)?like)$/i;
78 $opt{inequality_op} = qr/^(!=|<>|(is\s+)?not(\s+like)?)$/i;
79
80 # SQL booleans
81 $opt{sqltrue} ||= '1=1';
82 $opt{sqlfalse} ||= '0=1';
83
84 # special operators
85 $opt{special_ops} ||= [];
86 push @{$opt{special_ops}}, @BUILTIN_SPECIAL_OPS;
87
88 return bless \%opt, $class;
89}
90
91
92
93#======================================================================
94# INSERT methods
95#======================================================================
96
97sub insert {
98 my $self = shift;
99 my $table = $self->_table(shift);
100 my $data = shift || return;
101
102 my $method = $self->_METHOD_FOR_refkind("_insert", $data);
103 my ($sql, @bind) = $self->$method($data);
104 $sql = join " ", $self->_sqlcase('insert into'), $table, $sql;
105 return wantarray ? ($sql, @bind) : $sql;
106}
107
108sub _insert_HASHREF { # explicit list of fields and then values
109 my ($self, $data) = @_;
110
111 my @fields = sort keys %$data;
112
113 my ($sql, @bind);
114 { # get values (need temporary override of bindtype to avoid an error)
115 local $self->{bindtype} = 'normal';
116 ($sql, @bind) = $self->_insert_ARRAYREF([@{$data}{@fields}]);
117 }
118
119 # if necessary, transform values according to 'bindtype'
120 if ($self->{bindtype} eq 'columns') {
121 for my $i (0 .. $#fields) {
122 ($bind[$i]) = $self->_bindtype($fields[$i], $bind[$i]);
123 }
124 }
125
126 # assemble SQL
127 $_ = $self->_quote($_) foreach @fields;
128 $sql = "( ".join(", ", @fields).") ".$sql;
129
130 return ($sql, @bind);
131}
132
133sub _insert_ARRAYREF { # just generate values(?,?) part (no list of fields)
134 my ($self, $data) = @_;
135
136 # no names (arrayref) so can't generate bindtype
137 $self->{bindtype} ne 'columns'
138 or belch "can't do 'columns' bindtype when called with arrayref";
139
140 my (@values, @all_bind);
141 for my $v (@$data) {
142
143 $self->_SWITCH_refkind($v, {
144
145 ARRAYREF => sub {
146 if ($self->{array_datatypes}) { # if array datatype are activated
147 push @values, '?';
148 }
149 else { # else literal SQL with bind
150 my ($sql, @bind) = @$v;
151 push @values, $sql;
152 push @all_bind, @bind;
153 }
154 },
155
156 ARRAYREFREF => sub { # literal SQL with bind
157 my ($sql, @bind) = @${$v};
158 push @values, $sql;
159 push @all_bind, @bind;
160 },
161
162 # THINK : anything useful to do with a HASHREF ?
163
164 SCALARREF => sub { # literal SQL without bind
165 push @values, $$v;
166 },
167
168 SCALAR_or_UNDEF => sub {
169 push @values, '?';
170 push @all_bind, $v;
171 },
172
173 });
174
175 }
176
177 my $sql = $self->_sqlcase('values')." ( ".join(", ", @values)." )";
178 return ($sql, @all_bind);
179}
180
181
182sub _insert_ARRAYREFREF { # literal SQL with bind
183 my ($self, $data) = @_;
184 return @${$data};
185}
186
187
188sub _insert_SCALARREF { # literal SQL without bind
189 my ($self, $data) = @_;
190
191 return ($$data);
192}
193
194
195
196#======================================================================
197# UPDATE methods
198#======================================================================
199
200
201sub update {
202 my $self = shift;
203 my $table = $self->_table(shift);
204 my $data = shift || return;
205 my $where = shift;
206
207 # first build the 'SET' part of the sql statement
208 my (@set, @all_bind);
209 puke "Unsupported data type specified to \$sql->update"
210 unless ref $data eq 'HASH';
211
212 for my $k (sort keys %$data) {
213 my $v = $data->{$k};
214 my $r = ref $v;
215 my $label = $self->_quote($k);
216
217 $self->_SWITCH_refkind($v, {
218 ARRAYREF => sub {
219 if ($self->{array_datatypes}) { # array datatype
220 push @set, "$label = ?";
221 push @all_bind, $self->_bindtype($k, $v);
222 }
223 else { # literal SQL with bind
224 my ($sql, @bind) = @$v;
225 push @set, "$label = $sql";
226 push @all_bind, $self->_bindtype($k, @bind);
227 }
228 },
229 ARRAYREFREF => sub { # literal SQL with bind
230 my ($sql, @bind) = @${$v};
231 push @set, "$label = $sql";
232 push @all_bind, $self->_bindtype($k, @bind);
233 },
234 SCALARREF => sub { # literal SQL without bind
235 push @set, "$label = $$v";
236 },
237 SCALAR_or_UNDEF => sub {
238 push @set, "$label = ?";
239 push @all_bind, $self->_bindtype($k, $v);
240 },
241 });
242 }
243
244 # generate sql
245 my $sql = $self->_sqlcase('update') . " $table " . $self->_sqlcase('set ')
246 . join ', ', @set;
247
248 if ($where) {
249 my($where_sql, @where_bind) = $self->where($where);
250 $sql .= $where_sql;
251 push @all_bind, @where_bind;
252 }
253
254 return wantarray ? ($sql, @all_bind) : $sql;
255}
256
257
258
259
260#======================================================================
261# SELECT
262#======================================================================
263
264
265sub select {
266 my $self = shift;
267 my $table = $self->_table(shift);
268 my $fields = shift || '*';
269 my $where = shift;
270 my $order = shift;
271
272 my($where_sql, @bind) = $self->where($where, $order);
273
274 my $f = (ref $fields eq 'ARRAY') ? join ', ', map { $self->_quote($_) } @$fields
275 : $fields;
276 my $sql = join(' ', $self->_sqlcase('select'), $f,
277 $self->_sqlcase('from'), $table)
278 . $where_sql;
279
280 return wantarray ? ($sql, @bind) : $sql;
281}
282
283#======================================================================
284# DELETE
285#======================================================================
286
287
288sub delete {
289 my $self = shift;
290 my $table = $self->_table(shift);
291 my $where = shift;
292
293
294 my($where_sql, @bind) = $self->where($where);
295 my $sql = $self->_sqlcase('delete from') . " $table" . $where_sql;
296
297 return wantarray ? ($sql, @bind) : $sql;
298}
299
300
301#======================================================================
302# WHERE: entry point
303#======================================================================
304
305
306
307# Finally, a separate routine just to handle WHERE clauses
308sub where {
309 my ($self, $where, $order) = @_;
310
311 # where ?
312 my ($sql, @bind) = $self->_recurse_where($where);
313 $sql = $sql ? $self->_sqlcase(' where ') . "( $sql )" : '';
314
315 # order by?
316 if ($order) {
317 $sql .= $self->_order_by($order);
318 }
319
320 return wantarray ? ($sql, @bind) : $sql;
321}
322
323
324sub _recurse_where {
325 my ($self, $where, $logic) = @_;
326
327 # dispatch on appropriate method according to refkind of $where
328 my $method = $self->_METHOD_FOR_refkind("_where", $where);
311b2151 329
330
331 my ($sql, @bind) = $self->$method($where, $logic);
332
333 # DBIx::Class directly calls _recurse_where in scalar context, so
334 # we must implement it, even if not in the official API
335 return wantarray ? ($sql, @bind) : $sql;
96449e8e 336}
337
338
339
340#======================================================================
341# WHERE: top-level ARRAYREF
342#======================================================================
343
344
345sub _where_ARRAYREF {
346 my ($self, $where, $logic) = @_;
347
348 $logic = uc($logic || $self->{logic});
349 $logic eq 'AND' or $logic eq 'OR' or puke "unknown logic: $logic";
350
351 my @clauses = @$where;
352
353 # if the array starts with [-and|or => ...], recurse with that logic
354 my $first = $clauses[0] || '';
355 if ($first =~ /^-(and|or)/i) {
356 $logic = $1;
357 shift @clauses;
358 return $self->_where_ARRAYREF(\@clauses, $logic);
359 }
360
361 #otherwise..
362 my (@sql_clauses, @all_bind);
363
364 # need to use while() so can shift() for pairs
365 while (my $el = shift @clauses) {
366
367 # switch according to kind of $el and get corresponding ($sql, @bind)
368 my ($sql, @bind) = $self->_SWITCH_refkind($el, {
369
370 # skip empty elements, otherwise get invalid trailing AND stuff
371 ARRAYREF => sub {$self->_recurse_where($el) if @$el},
372
373 HASHREF => sub {$self->_recurse_where($el, 'and') if %$el},
374 # LDNOTE : previous SQLA code for hashrefs was creating a dirty
375 # side-effect: the first hashref within an array would change
376 # the global logic to 'AND'. So [ {cond1, cond2}, [cond3, cond4] ]
377 # was interpreted as "(cond1 AND cond2) OR (cond3 AND cond4)",
378 # whereas it should be "(cond1 AND cond2) OR (cond3 OR cond4)".
379
380 SCALARREF => sub { ($$el); },
381
382 SCALAR => sub {# top-level arrayref with scalars, recurse in pairs
383 $self->_recurse_where({$el => shift(@clauses)})},
384
385 UNDEF => sub {puke "not supported : UNDEF in arrayref" },
386 });
387
4b7b6026 388 if ($sql) {
389 push @sql_clauses, $sql;
390 push @all_bind, @bind;
391 }
96449e8e 392 }
393
394 return $self->_join_sql_clauses($logic, \@sql_clauses, \@all_bind);
395}
396
397
398
399#======================================================================
400# WHERE: top-level HASHREF
401#======================================================================
402
403sub _where_HASHREF {
404 my ($self, $where) = @_;
405 my (@sql_clauses, @all_bind);
406
407 # LDNOTE : don't really know why we need to sort keys
408 for my $k (sort keys %$where) {
409 my $v = $where->{$k};
410
411 # ($k => $v) is either a special op or a regular hashpair
412 my ($sql, @bind) = ($k =~ /^-(.+)/) ? $self->_where_op_in_hash($1, $v)
413 : do {
414 my $method = $self->_METHOD_FOR_refkind("_where_hashpair", $v);
415 $self->$method($k, $v);
416 };
417
418 push @sql_clauses, $sql;
419 push @all_bind, @bind;
420 }
421
422 return $self->_join_sql_clauses('and', \@sql_clauses, \@all_bind);
423}
424
425
426sub _where_op_in_hash {
427 my ($self, $op, $v) = @_;
428
429 $op =~ /^(AND|OR|NEST)[_\d]*/i
430 or puke "unknown operator: -$op";
431 $op = uc($1); # uppercase, remove trailing digits
432 $self->_debug("OP(-$op) within hashref, recursing...");
433
434 $self->_SWITCH_refkind($v, {
435
436 ARRAYREF => sub {
437 # LDNOTE : should deprecate {-or => [...]} and {-and => [...]}
438 # because they are misleading; the only proper way would be
439 # -nest => [-or => ...], -nest => [-and ...]
440 return $self->_where_ARRAYREF($v, $op eq 'NEST' ? '' : $op);
441 },
442
443 HASHREF => sub {
444 if ($op eq 'OR') {
445 belch "-or => {...} should be -nest => [...]";
446 return $self->_where_ARRAYREF([%$v], 'OR');
447 }
448 else { # NEST | AND
449 return $self->_where_HASHREF($v);
450 }
451 },
452
453 SCALARREF => sub { # literal SQL
454 $op eq 'NEST'
455 or puke "-$op => \\\$scalar not supported, use -nest => ...";
456 return ($$v);
457 },
458
459 ARRAYREFREF => sub { # literal SQL
460 $op eq 'NEST'
461 or puke "-$op => \\[..] not supported, use -nest => ...";
462 return @{${$v}};
463 },
464
465 SCALAR => sub { # permissively interpreted as SQL
466 $op eq 'NEST'
467 or puke "-$op => 'scalar' not supported, use -nest => \\'scalar'";
468 belch "literal SQL should be -nest => \\'scalar' "
469 . "instead of -nest => 'scalar' ";
470 return ($v);
471 },
472
473 UNDEF => sub {
474 puke "-$op => undef not supported";
475 },
476 });
477}
478
479
480sub _where_hashpair_ARRAYREF {
481 my ($self, $k, $v) = @_;
482
483 if( @$v ) {
484 my @v = @$v; # need copy because of shift below
485 $self->_debug("ARRAY($k) means distribute over elements");
486
487 # put apart first element if it is an operator (-and, -or)
488 my $op = $v[0] =~ /^-/ ? shift @v : undef;
489 $self->_debug("OP($op) reinjected into the distributed array") if $op;
490
491 my @distributed = map { {$k => $_} } @v;
492 unshift @distributed, $op if $op;
493
494 return $self->_recurse_where(\@distributed);
495 }
496 else {
497 # LDNOTE : not sure of this one. What does "distribute over nothing" mean?
498 $self->_debug("empty ARRAY($k) means 0=1");
499 return ($self->{sqlfalse});
500 }
501}
502
503sub _where_hashpair_HASHREF {
504 my ($self, $k, $v) = @_;
505
506 my (@all_sql, @all_bind);
507
508 for my $op (sort keys %$v) {
509 my $val = $v->{$op};
510
511 # put the operator in canonical form
512 $op =~ s/^-//; # remove initial dash
513 $op =~ tr/_/ /; # underscores become spaces
514 $op =~ s/^\s+//; # no initial space
515 $op =~ s/\s+$//; # no final space
516 $op =~ s/\s+/ /; # multiple spaces become one
517
518 my ($sql, @bind);
519
520 # CASE: special operators like -in or -between
521 my $special_op = first {$op =~ $_->{regex}} @{$self->{special_ops}};
522 if ($special_op) {
523 ($sql, @bind) = $special_op->{handler}->($self, $k, $op, $val);
524 }
525
526 # CASE: col => {op => \@vals}
527 elsif (ref $val eq 'ARRAY') {
528 ($sql, @bind) = $self->_where_field_op_ARRAYREF($k, $op, $val);
529 }
530
531 # CASE: col => {op => undef} : sql "IS (NOT)? NULL"
532 elsif (! defined($val)) {
533 my $is = ($op =~ $self->{equality_op}) ? 'is' :
534 ($op =~ $self->{inequality_op}) ? 'is not' :
535 puke "unexpected operator '$op' with undef operand";
536 $sql = $self->_quote($k) . $self->_sqlcase(" $is null");
537 }
538
539 # CASE: col => {op => $scalar}
540 else {
541 $sql = join ' ', $self->_convert($self->_quote($k)),
542 $self->_sqlcase($op),
543 $self->_convert('?');
544 @bind = $self->_bindtype($k, $val);
545 }
546
547 push @all_sql, $sql;
548 push @all_bind, @bind;
549 }
550
551 return $self->_join_sql_clauses('and', \@all_sql, \@all_bind);
552}
553
554
555
556sub _where_field_op_ARRAYREF {
557 my ($self, $k, $op, $vals) = @_;
558
559 if(@$vals) {
560 $self->_debug("ARRAY($vals) means multiple elements: [ @$vals ]");
561
562
563
564 # LDNOTE : change the distribution logic when
565 # $op =~ $self->{inequality_op}, because of Morgan laws :
566 # with {field => {'!=' => [22, 33]}}, it would be ridiculous to generate
567 # WHERE field != 22 OR field != 33 : the user probably means
568 # WHERE field != 22 AND field != 33.
569 my $logic = ($op =~ $self->{inequality_op}) ? 'AND' : 'OR';
570
571 # distribute $op over each member of @$vals
572 return $self->_recurse_where([map { {$k => {$op, $_}} } @$vals], $logic);
573
574 }
575 else {
576 # try to DWIM on equality operators
577 # LDNOTE : not 100% sure this is the correct thing to do ...
578 return ($self->{sqlfalse}) if $op =~ $self->{equality_op};
579 return ($self->{sqltrue}) if $op =~ $self->{inequality_op};
580
581 # otherwise
582 puke "operator '$op' applied on an empty array (field '$k')";
583 }
584}
585
586
587sub _where_hashpair_SCALARREF {
588 my ($self, $k, $v) = @_;
589 $self->_debug("SCALAR($k) means literal SQL: $$v");
590 my $sql = $self->_quote($k) . " " . $$v;
591 return ($sql);
592}
593
594sub _where_hashpair_ARRAYREFREF {
595 my ($self, $k, $v) = @_;
596 $self->_debug("REF($k) means literal SQL: @${$v}");
597 my ($sql, @bind) = @${$v};
598 $sql = $self->_quote($k) . " " . $sql;
599 @bind = $self->_bindtype($k, @bind);
600 return ($sql, @bind );
601}
602
603sub _where_hashpair_SCALAR {
604 my ($self, $k, $v) = @_;
605 $self->_debug("NOREF($k) means simple key=val: $k $self->{cmp} $v");
606 my $sql = join ' ', $self->_convert($self->_quote($k)),
607 $self->_sqlcase($self->{cmp}),
608 $self->_convert('?');
609 my @bind = $self->_bindtype($k, $v);
610 return ( $sql, @bind);
611}
612
613
614sub _where_hashpair_UNDEF {
615 my ($self, $k, $v) = @_;
616 $self->_debug("UNDEF($k) means IS NULL");
617 my $sql = $self->_quote($k) . $self->_sqlcase(' is null');
618 return ($sql);
619}
620
621#======================================================================
622# WHERE: TOP-LEVEL OTHERS (SCALARREF, SCALAR, UNDEF)
623#======================================================================
624
625
626sub _where_SCALARREF {
627 my ($self, $where) = @_;
628
629 # literal sql
630 $self->_debug("SCALAR(*top) means literal SQL: $$where");
631 return ($$where);
632}
633
634
635sub _where_SCALAR {
636 my ($self, $where) = @_;
637
638 # literal sql
639 $self->_debug("NOREF(*top) means literal SQL: $where");
640 return ($where);
641}
642
643
644sub _where_UNDEF {
645 my ($self) = @_;
646 return ();
647}
648
649
650#======================================================================
651# WHERE: BUILTIN SPECIAL OPERATORS (-in, -between)
652#======================================================================
653
654
655sub _where_field_BETWEEN {
656 my ($self, $k, $op, $vals) = @_;
657
658 ref $vals eq 'ARRAY' && @$vals == 2
659 or puke "special op 'between' requires an arrayref of two values";
660
661 my ($label) = $self->_convert($self->_quote($k));
662 my ($placeholder) = $self->_convert('?');
663 my $and = $self->_sqlcase('and');
664 $op = $self->_sqlcase($op);
665
666 my $sql = "( $label $op $placeholder $and $placeholder )";
667 my @bind = $self->_bindtype($k, @$vals);
668 return ($sql, @bind)
669}
670
671
672sub _where_field_IN {
673 my ($self, $k, $op, $vals) = @_;
674
675 # backwards compatibility : if scalar, force into an arrayref
676 $vals = [$vals] if defined $vals && ! ref $vals;
677
678 ref $vals eq 'ARRAY'
679 or puke "special op 'in' requires an arrayref";
680
681 my ($label) = $self->_convert($self->_quote($k));
682 my ($placeholder) = $self->_convert('?');
683 my $and = $self->_sqlcase('and');
684 $op = $self->_sqlcase($op);
685
686 if (@$vals) { # nonempty list
687 my $placeholders = join ", ", (($placeholder) x @$vals);
688 my $sql = "$label $op ( $placeholders )";
689 my @bind = $self->_bindtype($k, @$vals);
690
691 return ($sql, @bind);
692 }
693 else { # empty list : some databases won't understand "IN ()", so DWIM
694 my $sql = ($op =~ /\bnot\b/i) ? $self->{sqltrue} : $self->{sqlfalse};
695 return ($sql);
696 }
697}
698
699
700
701
702
703
704#======================================================================
705# ORDER BY
706#======================================================================
707
708sub _order_by {
709 my ($self, $arg) = @_;
710
711 # construct list of ordering instructions
712 my @order = $self->_SWITCH_refkind($arg, {
713
714 ARRAYREF => sub {
715 map {$self->_SWITCH_refkind($_, {
716 SCALAR => sub {$self->_quote($_)},
fffe6900 717 UNDEF => sub {},
96449e8e 718 SCALARREF => sub {$$_}, # literal SQL, no quoting
719 HASHREF => sub {$self->_order_by_hash($_)}
720 }) } @$arg;
721 },
722
723 SCALAR => sub {$self->_quote($arg)},
b6475fb1 724 UNDEF => sub {},
96449e8e 725 SCALARREF => sub {$$arg}, # literal SQL, no quoting
726 HASHREF => sub {$self->_order_by_hash($arg)},
727
728 });
729
730 # build SQL
731 my $order = join ', ', @order;
732 return $order ? $self->_sqlcase(' order by')." $order" : '';
733}
734
735
736sub _order_by_hash {
737 my ($self, $hash) = @_;
738
739 # get first pair in hash
740 my ($key, $val) = each %$hash;
741
742 # check if one pair was found and no other pair in hash
743 $key && !(each %$hash)
744 or puke "hash passed to _order_by must have exactly one key (-desc or -asc)";
745
746 my ($order) = ($key =~ /^-(desc|asc)/i)
747 or puke "invalid key in _order_by hash : $key";
748
749 return $self->_quote($val) ." ". $self->_sqlcase($order);
750}
751
752
753
754#======================================================================
755# DATASOURCE (FOR NOW, JUST PLAIN TABLE OR LIST OF TABLES)
756#======================================================================
757
758sub _table {
759 my $self = shift;
760 my $from = shift;
761 $self->_SWITCH_refkind($from, {
762 ARRAYREF => sub {join ', ', map { $self->_quote($_) } @$from;},
763 SCALAR => sub {$self->_quote($from)},
764 SCALARREF => sub {$$from},
765 ARRAYREFREF => sub {join ', ', @$from;},
766 });
767}
768
769
770#======================================================================
771# UTILITY FUNCTIONS
772#======================================================================
773
774sub _quote {
775 my $self = shift;
776 my $label = shift;
777
778 $label or puke "can't quote an empty label";
779
780 # left and right quote characters
781 my ($ql, $qr, @other) = $self->_SWITCH_refkind($self->{quote_char}, {
782 SCALAR => sub {($self->{quote_char}, $self->{quote_char})},
783 ARRAYREF => sub {@{$self->{quote_char}}},
784 UNDEF => sub {()},
785 });
786 not @other
787 or puke "quote_char must be an arrayref of 2 values";
788
789 # no quoting if no quoting chars
790 $ql or return $label;
791
792 # no quoting for literal SQL
793 return $$label if ref($label) eq 'SCALAR';
794
795 # separate table / column (if applicable)
796 my $sep = $self->{name_sep} || '';
797 my @to_quote = $sep ? split /\Q$sep\E/, $label : ($label);
798
799 # do the quoting, except for "*" or for `table`.*
800 my @quoted = map { $_ eq '*' ? $_: $ql.$_.$qr} @to_quote;
801
802 # reassemble and return.
803 return join $sep, @quoted;
804}
805
806
807# Conversion, if applicable
808sub _convert ($) {
809 my ($self, $arg) = @_;
810
811# LDNOTE : modified the previous implementation below because
812# it was not consistent : the first "return" is always an array,
813# the second "return" is context-dependent. Anyway, _convert
814# seems always used with just a single argument, so make it a
815# scalar function.
816# return @_ unless $self->{convert};
817# my $conv = $self->_sqlcase($self->{convert});
818# my @ret = map { $conv.'('.$_.')' } @_;
819# return wantarray ? @ret : $ret[0];
820 if ($self->{convert}) {
821 my $conv = $self->_sqlcase($self->{convert});
822 $arg = $conv.'('.$arg.')';
823 }
824 return $arg;
825}
826
827# And bindtype
828sub _bindtype (@) {
829 my $self = shift;
830 my($col, @vals) = @_;
831
832 #LDNOTE : changed original implementation below because it did not make
833 # sense when bindtype eq 'columns' and @vals > 1.
834# return $self->{bindtype} eq 'columns' ? [ $col, @vals ] : @vals;
835
836 return $self->{bindtype} eq 'columns' ? map {[$col, $_]} @vals : @vals;
837}
838
839sub _join_sql_clauses {
840 my ($self, $logic, $clauses_aref, $bind_aref) = @_;
841
842 if (@$clauses_aref > 1) {
843 my $join = " " . $self->_sqlcase($logic) . " ";
844 my $sql = '( ' . join($join, @$clauses_aref) . ' )';
845 return ($sql, @$bind_aref);
846 }
847 elsif (@$clauses_aref) {
848 return ($clauses_aref->[0], @$bind_aref); # no parentheses
849 }
850 else {
851 return (); # if no SQL, ignore @$bind_aref
852 }
853}
854
855
856# Fix SQL case, if so requested
857sub _sqlcase {
858 my $self = shift;
859
860 # LDNOTE: if $self->{case} is true, then it contains 'lower', so we
861 # don't touch the argument ... crooked logic, but let's not change it!
862 return $self->{case} ? $_[0] : uc($_[0]);
863}
864
865
866#======================================================================
867# DISPATCHING FROM REFKIND
868#======================================================================
869
870sub _refkind {
871 my ($self, $data) = @_;
872 my $suffix = '';
873 my $ref;
90aab162 874 my $n_steps = 0;
96449e8e 875
96449e8e 876 while (1) {
90aab162 877 # blessed objects are treated like scalars
878 $ref = (blessed $data) ? '' : ref $data;
879 $n_steps += 1 if $ref;
880 last if $ref ne 'REF';
96449e8e 881 $data = $$data;
882 }
883
90aab162 884 my $base = $ref || (defined $data ? 'SCALAR' : 'UNDEF');
885
886 return $base . ('REF' x $n_steps);
96449e8e 887}
888
90aab162 889
890
96449e8e 891sub _try_refkind {
892 my ($self, $data) = @_;
893 my @try = ($self->_refkind($data));
894 push @try, 'SCALAR_or_UNDEF' if $try[0] eq 'SCALAR' || $try[0] eq 'UNDEF';
895 push @try, 'FALLBACK';
896 return @try;
897}
898
899sub _METHOD_FOR_refkind {
900 my ($self, $meth_prefix, $data) = @_;
901 my $method = first {$_} map {$self->can($meth_prefix."_".$_)}
902 $self->_try_refkind($data)
903 or puke "cannot dispatch on '$meth_prefix' for ".$self->_refkind($data);
904 return $method;
905}
906
907
908sub _SWITCH_refkind {
909 my ($self, $data, $dispatch_table) = @_;
910
911 my $coderef = first {$_} map {$dispatch_table->{$_}}
912 $self->_try_refkind($data)
913 or puke "no dispatch entry for ".$self->_refkind($data);
914 $coderef->();
915}
916
917
918
919
920#======================================================================
921# VALUES, GENERATE, AUTOLOAD
922#======================================================================
923
924# LDNOTE: original code from nwiger, didn't touch code in that section
925# I feel the AUTOLOAD stuff should not be the default, it should
926# only be activated on explicit demand by user.
927
928sub values {
929 my $self = shift;
930 my $data = shift || return;
931 puke "Argument to ", __PACKAGE__, "->values must be a \\%hash"
932 unless ref $data eq 'HASH';
933 return map { $self->_bindtype($_, $data->{$_}) } sort keys %$data;
934}
935
936sub generate {
937 my $self = shift;
938
939 my(@sql, @sqlq, @sqlv);
940
941 for (@_) {
942 my $ref = ref $_;
943 if ($ref eq 'HASH') {
944 for my $k (sort keys %$_) {
945 my $v = $_->{$k};
946 my $r = ref $v;
947 my $label = $self->_quote($k);
948 if ($r eq 'ARRAY') {
949 # SQL included for values
950 my @bind = @$v;
951 my $sql = shift @bind;
952 push @sqlq, "$label = $sql";
953 push @sqlv, $self->_bindtype($k, @bind);
954 } elsif ($r eq 'SCALAR') {
955 # embedded literal SQL
956 push @sqlq, "$label = $$v";
957 } else {
958 push @sqlq, "$label = ?";
959 push @sqlv, $self->_bindtype($k, $v);
960 }
961 }
962 push @sql, $self->_sqlcase('set'), join ', ', @sqlq;
963 } elsif ($ref eq 'ARRAY') {
964 # unlike insert(), assume these are ONLY the column names, i.e. for SQL
965 for my $v (@$_) {
966 my $r = ref $v;
967 if ($r eq 'ARRAY') {
968 my @val = @$v;
969 push @sqlq, shift @val;
970 push @sqlv, @val;
971 } elsif ($r eq 'SCALAR') {
972 # embedded literal SQL
973 push @sqlq, $$v;
974 } else {
975 push @sqlq, '?';
976 push @sqlv, $v;
977 }
978 }
979 push @sql, '(' . join(', ', @sqlq) . ')';
980 } elsif ($ref eq 'SCALAR') {
981 # literal SQL
982 push @sql, $$_;
983 } else {
984 # strings get case twiddled
985 push @sql, $self->_sqlcase($_);
986 }
987 }
988
989 my $sql = join ' ', @sql;
990
991 # this is pretty tricky
992 # if ask for an array, return ($stmt, @bind)
993 # otherwise, s/?/shift @sqlv/ to put it inline
994 if (wantarray) {
995 return ($sql, @sqlv);
996 } else {
997 1 while $sql =~ s/\?/my $d = shift(@sqlv);
998 ref $d ? $d->[1] : $d/e;
999 return $sql;
1000 }
1001}
1002
1003
1004sub DESTROY { 1 }
1005
1006sub AUTOLOAD {
1007 # This allows us to check for a local, then _form, attr
1008 my $self = shift;
1009 my($name) = $AUTOLOAD =~ /.*::(.+)/;
1010 return $self->generate($name, @_);
1011}
1012
10131;
1014
1015
1016
1017__END__
32eab2da 1018
1019=head1 NAME
1020
1021SQL::Abstract - Generate SQL from Perl data structures
1022
1023=head1 SYNOPSIS
1024
1025 use SQL::Abstract;
1026
1027 my $sql = SQL::Abstract->new;
1028
1029 my($stmt, @bind) = $sql->select($table, \@fields, \%where, \@order);
1030
1031 my($stmt, @bind) = $sql->insert($table, \%fieldvals || \@values);
1032
1033 my($stmt, @bind) = $sql->update($table, \%fieldvals, \%where);
1034
1035 my($stmt, @bind) = $sql->delete($table, \%where);
1036
1037 # Then, use these in your DBI statements
1038 my $sth = $dbh->prepare($stmt);
1039 $sth->execute(@bind);
1040
1041 # Just generate the WHERE clause
abe72f94 1042 my($stmt, @bind) = $sql->where(\%where, \@order);
32eab2da 1043
1044 # Return values in the same order, for hashed queries
1045 # See PERFORMANCE section for more details
1046 my @bind = $sql->values(\%fieldvals);
1047
1048=head1 DESCRIPTION
1049
1050This module was inspired by the excellent L<DBIx::Abstract>.
1051However, in using that module I found that what I really wanted
1052to do was generate SQL, but still retain complete control over my
1053statement handles and use the DBI interface. So, I set out to
1054create an abstract SQL generation module.
1055
1056While based on the concepts used by L<DBIx::Abstract>, there are
1057several important differences, especially when it comes to WHERE
1058clauses. I have modified the concepts used to make the SQL easier
1059to generate from Perl data structures and, IMO, more intuitive.
1060The underlying idea is for this module to do what you mean, based
1061on the data structures you provide it. The big advantage is that
1062you don't have to modify your code every time your data changes,
1063as this module figures it out.
1064
1065To begin with, an SQL INSERT is as easy as just specifying a hash
1066of C<key=value> pairs:
1067
1068 my %data = (
1069 name => 'Jimbo Bobson',
1070 phone => '123-456-7890',
1071 address => '42 Sister Lane',
1072 city => 'St. Louis',
1073 state => 'Louisiana',
1074 );
1075
1076The SQL can then be generated with this:
1077
1078 my($stmt, @bind) = $sql->insert('people', \%data);
1079
1080Which would give you something like this:
1081
1082 $stmt = "INSERT INTO people
1083 (address, city, name, phone, state)
1084 VALUES (?, ?, ?, ?, ?)";
1085 @bind = ('42 Sister Lane', 'St. Louis', 'Jimbo Bobson',
1086 '123-456-7890', 'Louisiana');
1087
1088These are then used directly in your DBI code:
1089
1090 my $sth = $dbh->prepare($stmt);
1091 $sth->execute(@bind);
1092
96449e8e 1093=head2 Inserting and Updating Arrays
1094
1095If your database has array types (like for example Postgres),
1096activate the special option C<< array_datatypes => 1 >>
1097when creating the C<SQL::Abstract> object.
1098Then you may use an arrayref to insert and update database array types:
1099
1100 my $sql = SQL::Abstract->new(array_datatypes => 1);
1101 my %data = (
1102 planets => [qw/Mercury Venus Earth Mars/]
1103 );
1104
1105 my($stmt, @bind) = $sql->insert('solar_system', \%data);
1106
1107This results in:
1108
1109 $stmt = "INSERT INTO solar_system (planets) VALUES (?)"
1110
1111 @bind = (['Mercury', 'Venus', 'Earth', 'Mars']);
1112
1113
1114=head2 Inserting and Updating SQL
1115
1116In order to apply SQL functions to elements of your C<%data> you may
1117specify a reference to an arrayref for the given hash value. For example,
1118if you need to execute the Oracle C<to_date> function on a value, you can
1119say something like this:
32eab2da 1120
1121 my %data = (
1122 name => 'Bill',
96449e8e 1123 date_entered => \["to_date(?,'MM/DD/YYYY')", "03/02/2003"],
32eab2da 1124 );
1125
1126The first value in the array is the actual SQL. Any other values are
1127optional and would be included in the bind values array. This gives
1128you:
1129
1130 my($stmt, @bind) = $sql->insert('people', \%data);
1131
1132 $stmt = "INSERT INTO people (name, date_entered)
1133 VALUES (?, to_date(?,'MM/DD/YYYY'))";
1134 @bind = ('Bill', '03/02/2003');
1135
1136An UPDATE is just as easy, all you change is the name of the function:
1137
1138 my($stmt, @bind) = $sql->update('people', \%data);
1139
1140Notice that your C<%data> isn't touched; the module will generate
1141the appropriately quirky SQL for you automatically. Usually you'll
1142want to specify a WHERE clause for your UPDATE, though, which is
1143where handling C<%where> hashes comes in handy...
1144
96449e8e 1145=head2 Complex where statements
1146
32eab2da 1147This module can generate pretty complicated WHERE statements
1148easily. For example, simple C<key=value> pairs are taken to mean
1149equality, and if you want to see if a field is within a set
1150of values, you can use an arrayref. Let's say we wanted to
1151SELECT some data based on this criteria:
1152
1153 my %where = (
1154 requestor => 'inna',
1155 worker => ['nwiger', 'rcwe', 'sfz'],
1156 status => { '!=', 'completed' }
1157 );
1158
1159 my($stmt, @bind) = $sql->select('tickets', '*', \%where);
1160
1161The above would give you something like this:
1162
1163 $stmt = "SELECT * FROM tickets WHERE
1164 ( requestor = ? ) AND ( status != ? )
1165 AND ( worker = ? OR worker = ? OR worker = ? )";
1166 @bind = ('inna', 'completed', 'nwiger', 'rcwe', 'sfz');
1167
1168Which you could then use in DBI code like so:
1169
1170 my $sth = $dbh->prepare($stmt);
1171 $sth->execute(@bind);
1172
1173Easy, eh?
1174
1175=head1 FUNCTIONS
1176
1177The functions are simple. There's one for each major SQL operation,
1178and a constructor you use first. The arguments are specified in a
1179similar order to each function (table, then fields, then a where
1180clause) to try and simplify things.
1181
83cab70b 1182
83cab70b 1183
32eab2da 1184
1185=head2 new(option => 'value')
1186
1187The C<new()> function takes a list of options and values, and returns
1188a new B<SQL::Abstract> object which can then be used to generate SQL
1189through the methods below. The options accepted are:
1190
1191=over
1192
1193=item case
1194
1195If set to 'lower', then SQL will be generated in all lowercase. By
1196default SQL is generated in "textbook" case meaning something like:
1197
1198 SELECT a_field FROM a_table WHERE some_field LIKE '%someval%'
1199
96449e8e 1200Any setting other than 'lower' is ignored.
1201
32eab2da 1202=item cmp
1203
1204This determines what the default comparison operator is. By default
1205it is C<=>, meaning that a hash like this:
1206
1207 %where = (name => 'nwiger', email => 'nate@wiger.org');
1208
1209Will generate SQL like this:
1210
1211 WHERE name = 'nwiger' AND email = 'nate@wiger.org'
1212
1213However, you may want loose comparisons by default, so if you set
1214C<cmp> to C<like> you would get SQL such as:
1215
1216 WHERE name like 'nwiger' AND email like 'nate@wiger.org'
1217
1218You can also override the comparsion on an individual basis - see
1219the huge section on L</"WHERE CLAUSES"> at the bottom.
1220
96449e8e 1221=item sqltrue, sqlfalse
1222
1223Expressions for inserting boolean values within SQL statements.
1224By default these are C<1=1> and C<1=0>.
1225
32eab2da 1226=item logic
1227
1228This determines the default logical operator for multiple WHERE
1229statements in arrays. By default it is "or", meaning that a WHERE
1230array of the form:
1231
1232 @where = (
1233 event_date => {'>=', '2/13/99'},
1234 event_date => {'<=', '4/24/03'},
1235 );
1236
1237Will generate SQL like this:
1238
1239 WHERE event_date >= '2/13/99' OR event_date <= '4/24/03'
1240
1241This is probably not what you want given this query, though (look
1242at the dates). To change the "OR" to an "AND", simply specify:
1243
1244 my $sql = SQL::Abstract->new(logic => 'and');
1245
1246Which will change the above C<WHERE> to:
1247
1248 WHERE event_date >= '2/13/99' AND event_date <= '4/24/03'
1249
96449e8e 1250The logic can also be changed locally by inserting
1251an extra first element in the array :
1252
1253 @where = (-and => event_date => {'>=', '2/13/99'},
1254 event_date => {'<=', '4/24/03'} );
1255
1256See the L</"WHERE CLAUSES"> section for explanations.
1257
32eab2da 1258=item convert
1259
1260This will automatically convert comparisons using the specified SQL
1261function for both column and value. This is mostly used with an argument
1262of C<upper> or C<lower>, so that the SQL will have the effect of
1263case-insensitive "searches". For example, this:
1264
1265 $sql = SQL::Abstract->new(convert => 'upper');
1266 %where = (keywords => 'MaKe iT CAse inSeNSItive');
1267
1268Will turn out the following SQL:
1269
1270 WHERE upper(keywords) like upper('MaKe iT CAse inSeNSItive')
1271
1272The conversion can be C<upper()>, C<lower()>, or any other SQL function
1273that can be applied symmetrically to fields (actually B<SQL::Abstract> does
1274not validate this option; it will just pass through what you specify verbatim).
1275
1276=item bindtype
1277
1278This is a kludge because many databases suck. For example, you can't
1279just bind values using DBI's C<execute()> for Oracle C<CLOB> or C<BLOB> fields.
1280Instead, you have to use C<bind_param()>:
1281
1282 $sth->bind_param(1, 'reg data');
1283 $sth->bind_param(2, $lots, {ora_type => ORA_CLOB});
1284
1285The problem is, B<SQL::Abstract> will normally just return a C<@bind> array,
1286which loses track of which field each slot refers to. Fear not.
1287
1288If you specify C<bindtype> in new, you can determine how C<@bind> is returned.
1289Currently, you can specify either C<normal> (default) or C<columns>. If you
1290specify C<columns>, you will get an array that looks like this:
1291
1292 my $sql = SQL::Abstract->new(bindtype => 'columns');
1293 my($stmt, @bind) = $sql->insert(...);
1294
1295 @bind = (
1296 [ 'column1', 'value1' ],
1297 [ 'column2', 'value2' ],
1298 [ 'column3', 'value3' ],
1299 );
1300
1301You can then iterate through this manually, using DBI's C<bind_param()>.
e3f9dff4 1302
32eab2da 1303 $sth->prepare($stmt);
1304 my $i = 1;
1305 for (@bind) {
1306 my($col, $data) = @$_;
1307 if ($col eq 'details' || $col eq 'comments') {
1308 $sth->bind_param($i, $data, {ora_type => ORA_CLOB});
1309 } elsif ($col eq 'image') {
1310 $sth->bind_param($i, $data, {ora_type => ORA_BLOB});
1311 } else {
1312 $sth->bind_param($i, $data);
1313 }
1314 $i++;
1315 }
1316 $sth->execute; # execute without @bind now
1317
1318Now, why would you still use B<SQL::Abstract> if you have to do this crap?
1319Basically, the advantage is still that you don't have to care which fields
1320are or are not included. You could wrap that above C<for> loop in a simple
1321sub called C<bind_fields()> or something and reuse it repeatedly. You still
1322get a layer of abstraction over manual SQL specification.
1323
1324=item quote_char
1325
1326This is the character that a table or column name will be quoted
1327with. By default this is an empty string, but you could set it to
1328the character C<`>, to generate SQL like this:
1329
1330 SELECT `a_field` FROM `a_table` WHERE `some_field` LIKE '%someval%'
1331
96449e8e 1332Alternatively, you can supply an array ref of two items, the first being the left
1333hand quote character, and the second the right hand quote character. For
1334example, you could supply C<['[',']']> for SQL Server 2000 compliant quotes
1335that generates SQL like this:
1336
1337 SELECT [a_field] FROM [a_table] WHERE [some_field] LIKE '%someval%'
1338
1339Quoting is useful if you have tables or columns names that are reserved
1340words in your database's SQL dialect.
32eab2da 1341
1342=item name_sep
1343
1344This is the character that separates a table and column name. It is
1345necessary to specify this when the C<quote_char> option is selected,
1346so that tables and column names can be individually quoted like this:
1347
1348 SELECT `table`.`one_field` FROM `table` WHERE `table`.`other_field` = 1
1349
96449e8e 1350=item array_datatypes
32eab2da 1351
96449e8e 1352When this option is true, arrayrefs in INSERT or UPDATE are
1353interpreted as array datatypes and are passed directly
1354to the DBI layer.
1355When this option is false, arrayrefs are interpreted
1356as literal SQL, just like refs to arrayrefs
1357(but this behavior is for backwards compatibility; when writing
1358new queries, use the "reference to arrayref" syntax
1359for literal SQL).
32eab2da 1360
32eab2da 1361
96449e8e 1362=item special_ops
32eab2da 1363
96449e8e 1364Takes a reference to a list of "special operators"
1365to extend the syntax understood by L<SQL::Abstract>.
1366See section L</"SPECIAL OPERATORS"> for details.
32eab2da 1367
32eab2da 1368
32eab2da 1369
96449e8e 1370=back
32eab2da 1371
1372=head2 insert($table, \@values || \%fieldvals)
1373
1374This is the simplest function. You simply give it a table name
1375and either an arrayref of values or hashref of field/value pairs.
1376It returns an SQL INSERT statement and a list of bind values.
96449e8e 1377See the sections on L</"Inserting and Updating Arrays"> and
1378L</"Inserting and Updating SQL"> for information on how to insert
1379with those data types.
32eab2da 1380
1381=head2 update($table, \%fieldvals, \%where)
1382
1383This takes a table, hashref of field/value pairs, and an optional
86298391 1384hashref L<WHERE clause|/WHERE CLAUSES>. It returns an SQL UPDATE function and a list
32eab2da 1385of bind values.
96449e8e 1386See the sections on L</"Inserting and Updating Arrays"> and
1387L</"Inserting and Updating SQL"> for information on how to insert
1388with those data types.
32eab2da 1389
96449e8e 1390=head2 select($source, $fields, $where, $order)
32eab2da 1391
96449e8e 1392This returns a SQL SELECT statement and associated list of bind values, as
1393specified by the arguments :
32eab2da 1394
96449e8e 1395=over
32eab2da 1396
96449e8e 1397=item $source
32eab2da 1398
96449e8e 1399Specification of the 'FROM' part of the statement.
1400The argument can be either a plain scalar (interpreted as a table
1401name, will be quoted), or an arrayref (interpreted as a list
1402of table names, joined by commas, quoted), or a scalarref
1403(literal table name, not quoted), or a ref to an arrayref
1404(list of literal table names, joined by commas, not quoted).
32eab2da 1405
96449e8e 1406=item $fields
32eab2da 1407
96449e8e 1408Specification of the list of fields to retrieve from
1409the source.
1410The argument can be either an arrayref (interpreted as a list
1411of field names, will be joined by commas and quoted), or a
1412plain scalar (literal SQL, not quoted).
1413Please observe that this API is not as flexible as for
e3f9dff4 1414the first argument C<$table>, for backwards compatibility reasons.
32eab2da 1415
96449e8e 1416=item $where
32eab2da 1417
96449e8e 1418Optional argument to specify the WHERE part of the query.
1419The argument is most often a hashref, but can also be
1420an arrayref or plain scalar --
1421see section L<WHERE clause|/"WHERE CLAUSES"> for details.
32eab2da 1422
96449e8e 1423=item $order
32eab2da 1424
96449e8e 1425Optional argument to specify the ORDER BY part of the query.
1426The argument can be a scalar, a hashref or an arrayref
1427-- see section L<ORDER BY clause|/"ORDER BY CLAUSES">
1428for details.
32eab2da 1429
96449e8e 1430=back
32eab2da 1431
32eab2da 1432
1433=head2 delete($table, \%where)
1434
86298391 1435This takes a table name and optional hashref L<WHERE clause|/WHERE CLAUSES>.
32eab2da 1436It returns an SQL DELETE statement and list of bind values.
1437
32eab2da 1438=head2 where(\%where, \@order)
1439
1440This is used to generate just the WHERE clause. For example,
1441if you have an arbitrary data structure and know what the
1442rest of your SQL is going to look like, but want an easy way
1443to produce a WHERE clause, use this. It returns an SQL WHERE
1444clause and list of bind values.
1445
32eab2da 1446
1447=head2 values(\%data)
1448
1449This just returns the values from the hash C<%data>, in the same
1450order that would be returned from any of the other above queries.
1451Using this allows you to markedly speed up your queries if you
1452are affecting lots of rows. See below under the L</"PERFORMANCE"> section.
1453
32eab2da 1454=head2 generate($any, 'number', $of, \@data, $struct, \%types)
1455
1456Warning: This is an experimental method and subject to change.
1457
1458This returns arbitrarily generated SQL. It's a really basic shortcut.
1459It will return two different things, depending on return context:
1460
1461 my($stmt, @bind) = $sql->generate('create table', \$table, \@fields);
1462 my $stmt_and_val = $sql->generate('create table', \$table, \@fields);
1463
1464These would return the following:
1465
1466 # First calling form
1467 $stmt = "CREATE TABLE test (?, ?)";
1468 @bind = (field1, field2);
1469
1470 # Second calling form
1471 $stmt_and_val = "CREATE TABLE test (field1, field2)";
1472
1473Depending on what you're trying to do, it's up to you to choose the correct
1474format. In this example, the second form is what you would want.
1475
1476By the same token:
1477
1478 $sql->generate('alter session', { nls_date_format => 'MM/YY' });
1479
1480Might give you:
1481
1482 ALTER SESSION SET nls_date_format = 'MM/YY'
1483
1484You get the idea. Strings get their case twiddled, but everything
1485else remains verbatim.
1486
32eab2da 1487
32eab2da 1488
32eab2da 1489
1490=head1 WHERE CLAUSES
1491
96449e8e 1492=head2 Introduction
1493
32eab2da 1494This module uses a variation on the idea from L<DBIx::Abstract>. It
1495is B<NOT>, repeat I<not> 100% compatible. B<The main logic of this
1496module is that things in arrays are OR'ed, and things in hashes
1497are AND'ed.>
1498
1499The easiest way to explain is to show lots of examples. After
1500each C<%where> hash shown, it is assumed you used:
1501
1502 my($stmt, @bind) = $sql->where(\%where);
1503
1504However, note that the C<%where> hash can be used directly in any
1505of the other functions as well, as described above.
1506
96449e8e 1507=head2 Key-value pairs
1508
32eab2da 1509So, let's get started. To begin, a simple hash:
1510
1511 my %where = (
1512 user => 'nwiger',
1513 status => 'completed'
1514 );
1515
1516Is converted to SQL C<key = val> statements:
1517
1518 $stmt = "WHERE user = ? AND status = ?";
1519 @bind = ('nwiger', 'completed');
1520
1521One common thing I end up doing is having a list of values that
1522a field can be in. To do this, simply specify a list inside of
1523an arrayref:
1524
1525 my %where = (
1526 user => 'nwiger',
1527 status => ['assigned', 'in-progress', 'pending'];
1528 );
1529
1530This simple code will create the following:
1531
1532 $stmt = "WHERE user = ? AND ( status = ? OR status = ? OR status = ? )";
1533 @bind = ('nwiger', 'assigned', 'in-progress', 'pending');
1534
96449e8e 1535An empty arrayref will be considered a logical false and
8a68b5be 1536will generate 0=1.
1537
96449e8e 1538=head2 Key-value pairs
1539
32eab2da 1540If you want to specify a different type of operator for your comparison,
1541you can use a hashref for a given column:
1542
1543 my %where = (
1544 user => 'nwiger',
1545 status => { '!=', 'completed' }
1546 );
1547
1548Which would generate:
1549
1550 $stmt = "WHERE user = ? AND status != ?";
1551 @bind = ('nwiger', 'completed');
1552
1553To test against multiple values, just enclose the values in an arrayref:
1554
1555 status => { '!=', ['assigned', 'in-progress', 'pending'] };
1556
1557Which would give you:
1558
96449e8e 1559 "WHERE status != ? AND status != ? AND status != ?"
32eab2da 1560
96449e8e 1561Notice that since the operator was recognized as being a 'negative'
1562operator, the arrayref was interpreted with 'AND' logic (because
1563of Morgan's laws). By contrast, the reverse
1564
1565 status => { '=', ['assigned', 'in-progress', 'pending'] };
1566
1567would generate :
1568
1569 "WHERE status = ? OR status = ? OR status = ?"
1570
1571
1572The hashref can also contain multiple pairs, in which case it is expanded
32eab2da 1573into an C<AND> of its elements:
1574
1575 my %where = (
1576 user => 'nwiger',
1577 status => { '!=', 'completed', -not_like => 'pending%' }
1578 );
1579
1580 # Or more dynamically, like from a form
1581 $where{user} = 'nwiger';
1582 $where{status}{'!='} = 'completed';
1583 $where{status}{'-not_like'} = 'pending%';
1584
1585 # Both generate this
1586 $stmt = "WHERE user = ? AND status != ? AND status NOT LIKE ?";
1587 @bind = ('nwiger', 'completed', 'pending%');
1588
96449e8e 1589
32eab2da 1590To get an OR instead, you can combine it with the arrayref idea:
1591
1592 my %where => (
1593 user => 'nwiger',
1594 priority => [ {'=', 2}, {'!=', 1} ]
1595 );
1596
1597Which would generate:
1598
1599 $stmt = "WHERE user = ? AND priority = ? OR priority != ?";
1600 @bind = ('nwiger', '2', '1');
1601
96449e8e 1602
1603=head2 Logic and nesting operators
1604
1605In the example above,
1606there is a subtle trap if you want to say something like
32eab2da 1607this (notice the C<AND>):
1608
1609 WHERE priority != ? AND priority != ?
1610
1611Because, in Perl you I<can't> do this:
1612
1613 priority => { '!=', 2, '!=', 1 }
1614
1615As the second C<!=> key will obliterate the first. The solution
1616is to use the special C<-modifier> form inside an arrayref:
1617
96449e8e 1618 priority => [ -and => {'!=', 2},
1619 {'!=', 1} ]
1620
32eab2da 1621
1622Normally, these would be joined by C<OR>, but the modifier tells it
1623to use C<AND> instead. (Hint: You can use this in conjunction with the
1624C<logic> option to C<new()> in order to change the way your queries
1625work by default.) B<Important:> Note that the C<-modifier> goes
1626B<INSIDE> the arrayref, as an extra first element. This will
1627B<NOT> do what you think it might:
1628
1629 priority => -and => [{'!=', 2}, {'!=', 1}] # WRONG!
1630
1631Here is a quick list of equivalencies, since there is some overlap:
1632
1633 # Same
1634 status => {'!=', 'completed', 'not like', 'pending%' }
1635 status => [ -and => {'!=', 'completed'}, {'not like', 'pending%'}]
1636
1637 # Same
1638 status => {'=', ['assigned', 'in-progress']}
1639 status => [ -or => {'=', 'assigned'}, {'=', 'in-progress'}]
1640 status => [ {'=', 'assigned'}, {'=', 'in-progress'} ]
1641
1642In addition to C<-and> and C<-or>, there is also a special C<-nest>
1643operator which adds an additional set of parens, to create a subquery.
1644For example, to get something like this:
1645
86298391 1646 $stmt = "WHERE user = ? AND ( workhrs > ? OR geo = ? )";
32eab2da 1647 @bind = ('nwiger', '20', 'ASIA');
1648
1649You would do:
1650
1651 my %where = (
1652 user => 'nwiger',
1653 -nest => [ workhrs => {'>', 20}, geo => 'ASIA' ],
1654 );
1655
e3f9dff4 1656If you need several nested subexpressions, you can number
1657the C<-nest> branches :
1658
1659 my %where = (
1660 user => 'nwiger',
1661 -nest1 => ...,
1662 -nest2 => ...,
1663 ...
1664 );
1665
1666
96449e8e 1667=head2 Special operators : IN, BETWEEN, etc.
1668
32eab2da 1669You can also use the hashref format to compare a list of fields using the
1670C<IN> comparison operator, by specifying the list as an arrayref:
1671
1672 my %where = (
1673 status => 'completed',
1674 reportid => { -in => [567, 2335, 2] }
1675 );
1676
1677Which would generate:
1678
1679 $stmt = "WHERE status = ? AND reportid IN (?,?,?)";
1680 @bind = ('completed', '567', '2335', '2');
1681
96449e8e 1682The reverse operator C<-not_in> generates SQL C<NOT IN> and is used in
1683the same way.
1684
1685Another pair of operators is C<-between> and C<-not_between>,
1686used with an arrayref of two values:
32eab2da 1687
1688 my %where = (
1689 user => 'nwiger',
1690 completion_date => {
1691 -not_between => ['2002-10-01', '2003-02-06']
1692 }
1693 );
1694
1695Would give you:
1696
1697 WHERE user = ? AND completion_date NOT BETWEEN ( ? AND ? )
1698
96449e8e 1699These are the two builtin "special operators"; but the
1700list can be expanded : see section L</"SPECIAL OPERATORS"> below.
1701
1702=head2 Nested conditions
1703
32eab2da 1704So far, we've seen how multiple conditions are joined with a top-level
1705C<AND>. We can change this by putting the different conditions we want in
1706hashes and then putting those hashes in an array. For example:
1707
1708 my @where = (
1709 {
1710 user => 'nwiger',
1711 status => { -like => ['pending%', 'dispatched'] },
1712 },
1713 {
1714 user => 'robot',
1715 status => 'unassigned',
1716 }
1717 );
1718
1719This data structure would create the following:
1720
1721 $stmt = "WHERE ( user = ? AND ( status LIKE ? OR status LIKE ? ) )
1722 OR ( user = ? AND status = ? ) )";
1723 @bind = ('nwiger', 'pending', 'dispatched', 'robot', 'unassigned');
1724
1725This can be combined with the C<-nest> operator to properly group
1726SQL statements:
1727
1728 my @where = (
1729 -and => [
1730 user => 'nwiger',
1731 -nest => [
d2a8fe1a 1732 ["-and", workhrs => {'>', 20}, geo => 'ASIA' ],
1733 ["-and", workhrs => {'<', 50}, geo => 'EURO' ]
32eab2da 1734 ],
1735 ],
1736 );
1737
1738That would yield:
1739
1740 WHERE ( user = ? AND
1741 ( ( workhrs > ? AND geo = ? )
1742 OR ( workhrs < ? AND geo = ? ) ) )
1743
96449e8e 1744=head2 Literal SQL
1745
32eab2da 1746Finally, sometimes only literal SQL will do. If you want to include
1747literal SQL verbatim, you can specify it as a scalar reference, namely:
1748
1749 my $inn = 'is Not Null';
1750 my %where = (
1751 priority => { '<', 2 },
1752 requestor => \$inn
1753 );
1754
1755This would create:
1756
1757 $stmt = "WHERE priority < ? AND requestor is Not Null";
1758 @bind = ('2');
1759
1760Note that in this example, you only get one bind parameter back, since
1761the verbatim SQL is passed as part of the statement.
1762
1763Of course, just to prove a point, the above can also be accomplished
1764with this:
1765
1766 my %where = (
1767 priority => { '<', 2 },
1768 requestor => { '!=', undef },
1769 );
1770
96449e8e 1771
32eab2da 1772TMTOWTDI.
1773
96449e8e 1774Conditions on boolean columns can be expressed in the
1775same way, passing a reference to an empty string :
1776
1777 my %where = (
1778 priority => { '<', 2 },
1779 is_ready => \"";
1780 );
1781
1782which yields
1783
1784 $stmt = "WHERE priority < ? AND is_ready";
1785 @bind = ('2');
1786
1787
1788=head2 Literal SQL with placeholders and bind values (subqueries)
1789
1790If the literal SQL to be inserted has placeholders and bind values,
1791use a reference to an arrayref (yes this is a double reference --
1792not so common, but perfectly legal Perl). For example, to find a date
1793in Postgres you can use something like this:
1794
1795 my %where = (
1796 date_column => \[q/= date '2008-09-30' - ?::integer/, 10/]
1797 )
1798
1799This would create:
1800
d2a8fe1a 1801 $stmt = "WHERE ( date_column = date '2008-09-30' - ?::integer )"
96449e8e 1802 @bind = ('10');
1803
1804
1805Literal SQL is especially useful for nesting parenthesized clauses in the
1806main SQL query. Here is a first example :
1807
1808 my ($sub_stmt, @sub_bind) = ("SELECT c1 FROM t1 WHERE c2 < ? AND c3 LIKE ?",
1809 100, "foo%");
1810 my %where = (
1811 foo => 1234,
1812 bar => \["IN ($sub_stmt)" => @sub_bind],
1813 );
1814
1815This yields :
1816
1817 $stmt = "WHERE (foo = ? AND bar IN (SELECT c1 FROM t1
1818 WHERE c2 < ? AND c3 LIKE ?))";
1819 @bind = (1234, 100, "foo%");
1820
1821Other subquery operators, like for example C<"E<gt> ALL"> or C<"NOT IN">,
1822are expressed in the same way. Of course the C<$sub_stmt> and
1823its associated bind values can be generated through a former call
1824to C<select()> :
1825
1826 my ($sub_stmt, @sub_bind)
1827 = $sql->select("t1", "c1", {c2 => {"<" => 100},
1828 c3 => {-like => "foo%"}});
1829 my %where = (
1830 foo => 1234,
1831 bar => \["> ALL ($sub_stmt)" => @sub_bind],
1832 );
1833
1834In the examples above, the subquery was used as an operator on a column;
1835but the same principle also applies for a clause within the main C<%where>
1836hash, like an EXISTS subquery :
1837
1838 my ($sub_stmt, @sub_bind)
1839 = $sql->select("t1", "*", {c1 => 1, c2 => \"> t0.c0"});
1840 my %where = (
1841 foo => 1234,
1842 -nest => \["EXISTS ($sub_stmt)" => @sub_bind],
1843 );
1844
1845which yields
1846
1847 $stmt = "WHERE (foo = ? AND EXISTS (SELECT * FROM t1
1848 WHERE c1 = ? AND c2 > t0.c0))";
1849 @bind = (1234, 1);
1850
1851
1852Observe that the condition on C<c2> in the subquery refers to
1853column C<t0.c0> of the main query : this is I<not> a bind
1854value, so we have to express it through a scalar ref.
1855Writing C<< c2 => {">" => "t0.c0"} >> would have generated
1856C<< c2 > ? >> with bind value C<"t0.c0"> ... not exactly
1857what we wanted here.
1858
1859Another use of the subquery technique is when some SQL clauses need
1860parentheses, as it often occurs with some proprietary SQL extensions
1861like for example fulltext expressions, geospatial expressions,
1862NATIVE clauses, etc. Here is an example of a fulltext query in MySQL :
1863
1864 my %where = (
1865 -nest => \["MATCH (col1, col2) AGAINST (?)" => qw/apples/]
1866 );
1867
1868Finally, here is an example where a subquery is used
1869for expressing unary negation:
1870
1871 my ($sub_stmt, @sub_bind)
1872 = $sql->where({age => [{"<" => 10}, {">" => 20}]});
1873 $sub_stmt =~ s/^ where //i; # don't want "WHERE" in the subclause
1874 my %where = (
1875 lname => {like => '%son%'},
1876 -nest => \["NOT ($sub_stmt)" => @sub_bind],
1877 );
1878
1879This yields
1880
1881 $stmt = "lname LIKE ? AND NOT ( age < ? OR age > ? )"
1882 @bind = ('%son%', 10, 20)
1883
1884
1885
1886=head2 Conclusion
1887
32eab2da 1888These pages could go on for a while, since the nesting of the data
1889structures this module can handle are pretty much unlimited (the
1890module implements the C<WHERE> expansion as a recursive function
1891internally). Your best bet is to "play around" with the module a
1892little to see how the data structures behave, and choose the best
1893format for your data based on that.
1894
1895And of course, all the values above will probably be replaced with
1896variables gotten from forms or the command line. After all, if you
1897knew everything ahead of time, you wouldn't have to worry about
1898dynamically-generating SQL and could just hardwire it into your
1899script.
1900
96449e8e 1901
1902
1903
86298391 1904=head1 ORDER BY CLAUSES
1905
1906Some functions take an order by clause. This can either be a scalar (just a
1907column name,) a hash of C<< { -desc => 'col' } >> or C<< { -asc => 'col' } >>,
1cfa1db3 1908or an array of either of the two previous forms. Examples:
1909
1910 Given | Will Generate
1911 ----------------------------------------------------------
1912 \'colA DESC' | ORDER BY colA DESC
1913 'colA' | ORDER BY colA
1914 [qw/colA colB/] | ORDER BY colA, colB
1915 {-asc => 'colA'} | ORDER BY colA ASC
1916 {-desc => 'colB'} | ORDER BY colB DESC
1917 [ |
1918 {-asc => 'colA'}, | ORDER BY colA ASC, colB DESC
1919 {-desc => 'colB'} |
1920 ] |
1921 [colA => {-asc => 'colB'}] | ORDER BY colA, colB ASC
1922 ==========================================================
86298391 1923
96449e8e 1924
1925
1926=head1 SPECIAL OPERATORS
1927
e3f9dff4 1928 my $sqlmaker = SQL::Abstract->new(special_ops => [
1929 {regex => qr/.../,
1930 handler => sub {
1931 my ($self, $field, $op, $arg) = @_;
1932 ...
1933 },
1934 },
1935 ]);
1936
1937A "special operator" is a SQL syntactic clause that can be
1938applied to a field, instead of a usual binary operator.
1939For example :
1940
1941 WHERE field IN (?, ?, ?)
1942 WHERE field BETWEEN ? AND ?
1943 WHERE MATCH(field) AGAINST (?, ?)
96449e8e 1944
e3f9dff4 1945Special operators IN and BETWEEN are fairly standard and therefore
1946are builtin within C<SQL::Abstract>. For other operators,
1947like the MATCH .. AGAINST example above which is
1948specific to MySQL, you can write your own operator handlers :
1949supply a C<special_ops> argument to the C<new> method.
1950That argument takes an arrayref of operator definitions;
1951each operator definition is a hashref with two entries
96449e8e 1952
e3f9dff4 1953=over
1954
1955=item regex
1956
1957the regular expression to match the operator
96449e8e 1958
e3f9dff4 1959=item handler
1960
1961coderef that will be called when meeting that operator
1962in the input tree. The coderef will be called with
1963arguments C<< ($self, $field, $op, $arg) >>, and
1964should return a C<< ($sql, @bind) >> structure.
1965
1966=back
1967
1968For example, here is an implementation
1969of the MATCH .. AGAINST syntax for MySQL
1970
1971 my $sqlmaker = SQL::Abstract->new(special_ops => [
1972
1973 # special op for MySql MATCH (field) AGAINST(word1, word2, ...)
1974 {regex => qr/^match$/i,
1975 handler => sub {
1976 my ($self, $field, $op, $arg) = @_;
1977 $arg = [$arg] if not ref $arg;
1978 my $label = $self->_quote($field);
1979 my ($placeholder) = $self->_convert('?');
1980 my $placeholders = join ", ", (($placeholder) x @$arg);
1981 my $sql = $self->_sqlcase('match') . " ($label) "
1982 . $self->_sqlcase('against') . " ($placeholders) ";
1983 my @bind = $self->_bindtype($field, @$arg);
1984 return ($sql, @bind);
1985 }
1986 },
1987
1988 ]);
96449e8e 1989
1990
32eab2da 1991=head1 PERFORMANCE
1992
1993Thanks to some benchmarking by Mark Stosberg, it turns out that
1994this module is many orders of magnitude faster than using C<DBIx::Abstract>.
1995I must admit this wasn't an intentional design issue, but it's a
1996byproduct of the fact that you get to control your C<DBI> handles
1997yourself.
1998
1999To maximize performance, use a code snippet like the following:
2000
2001 # prepare a statement handle using the first row
2002 # and then reuse it for the rest of the rows
2003 my($sth, $stmt);
2004 for my $href (@array_of_hashrefs) {
2005 $stmt ||= $sql->insert('table', $href);
2006 $sth ||= $dbh->prepare($stmt);
2007 $sth->execute($sql->values($href));
2008 }
2009
2010The reason this works is because the keys in your C<$href> are sorted
2011internally by B<SQL::Abstract>. Thus, as long as your data retains
2012the same structure, you only have to generate the SQL the first time
2013around. On subsequent queries, simply use the C<values> function provided
2014by this module to return your values in the correct order.
2015
96449e8e 2016
32eab2da 2017=head1 FORMBUILDER
2018
2019If you use my C<CGI::FormBuilder> module at all, you'll hopefully
2020really like this part (I do, at least). Building up a complex query
2021can be as simple as the following:
2022
2023 #!/usr/bin/perl
2024
2025 use CGI::FormBuilder;
2026 use SQL::Abstract;
2027
2028 my $form = CGI::FormBuilder->new(...);
2029 my $sql = SQL::Abstract->new;
2030
2031 if ($form->submitted) {
2032 my $field = $form->field;
2033 my $id = delete $field->{id};
2034 my($stmt, @bind) = $sql->update('table', $field, {id => $id});
2035 }
2036
2037Of course, you would still have to connect using C<DBI> to run the
2038query, but the point is that if you make your form look like your
2039table, the actual query script can be extremely simplistic.
2040
2041If you're B<REALLY> lazy (I am), check out C<HTML::QuickTable> for
2042a fast interface to returning and formatting data. I frequently
2043use these three modules together to write complex database query
2044apps in under 50 lines.
2045
32eab2da 2046
96449e8e 2047=head1 CHANGES
2048
2049Version 1.50 was a major internal refactoring of C<SQL::Abstract>.
2050Great care has been taken to preserve the I<published> behavior
2051documented in previous versions in the 1.* family; however,
2052some features that were previously undocumented, or behaved
2053differently from the documentation, had to be changed in order
2054to clarify the semantics. Hence, client code that was relying
2055on some dark areas of C<SQL::Abstract> v1.*
2056B<might behave differently> in v1.50.
32eab2da 2057
d2a8fe1a 2058The main changes are :
2059
96449e8e 2060=over
32eab2da 2061
96449e8e 2062=item *
32eab2da 2063
96449e8e 2064support for literal SQL through the C<< \ [$sql, bind] >> syntax.
2065
2066=item *
2067
2068added -nest1, -nest2 or -nest_1, -nest_2, ...
2069
2070=item *
2071
2072optional support for L<array datatypes|/"Inserting and Updating Arrays">
2073
2074=item *
2075
2076defensive programming : check arguments
2077
2078=item *
2079
2080fixed bug with global logic, which was previously implemented
2081through global variables yielding side-effects. Prior versons would
2082interpret C<< [ {cond1, cond2}, [cond3, cond4] ] >>
2083as C<< "(cond1 AND cond2) OR (cond3 AND cond4)" >>.
2084Now this is interpreted
2085as C<< "(cond1 AND cond2) OR (cond3 OR cond4)" >>.
2086
2087=item *
2088
2089C<-and> / C<-or> operators are no longer accepted
2090in the middle of an arrayref : they are
2091only admitted if in first position.
2092
2093=item *
2094
2095changed logic for distributing an op over arrayrefs
2096
2097=item *
2098
2099fixed semantics of _bindtype on array args
2100
2101=item *
2102
2103dropped the C<_anoncopy> of the %where tree. No longer necessary,
2104we just avoid shifting arrays within that tree.
2105
2106=item *
2107
2108dropped the C<_modlogic> function
2109
2110=back
32eab2da 2111
32eab2da 2112
32eab2da 2113
2114=head1 ACKNOWLEDGEMENTS
2115
2116There are a number of individuals that have really helped out with
2117this module. Unfortunately, most of them submitted bugs via CPAN
2118so I have no idea who they are! But the people I do know are:
2119
86298391 2120 Ash Berlin (order_by hash term support)
b643abe1 2121 Matt Trout (DBIx::Class support)
32eab2da 2122 Mark Stosberg (benchmarking)
2123 Chas Owens (initial "IN" operator support)
2124 Philip Collins (per-field SQL functions)
2125 Eric Kolve (hashref "AND" support)
2126 Mike Fragassi (enhancements to "BETWEEN" and "LIKE")
2127 Dan Kubb (support for "quote_char" and "name_sep")
f5aab26e 2128 Guillermo Roditi (patch to cleanup "IN" and "BETWEEN", fix and tests for _order_by)
96449e8e 2129 Laurent Dami (internal refactoring, multiple -nest, extensible list of special operators, literal SQL)
32eab2da 2130
2131Thanks!
2132
32eab2da 2133=head1 SEE ALSO
2134
86298391 2135L<DBIx::Class>, L<DBIx::Abstract>, L<CGI::FormBuilder>, L<HTML::QuickTable>.
32eab2da 2136
32eab2da 2137=head1 AUTHOR
2138
b643abe1 2139Copyright (c) 2001-2007 Nathan Wiger <nwiger@cpan.org>. All Rights Reserved.
2140
2141This module is actively maintained by Matt Trout <mst@shadowcatsystems.co.uk>
32eab2da 2142
abe72f94 2143For support, your best bet is to try the C<DBIx::Class> users mailing list.
2144While not an official support venue, C<DBIx::Class> makes heavy use of
2145C<SQL::Abstract>, and as such list members there are very familiar with
2146how to create queries.
2147
32eab2da 2148This module is free software; you may copy this under the terms of
2149the GNU General Public License, or the Artistic License, copies of
2150which should have accompanied your Perl kit.
2151
2152=cut
2153