Variation of dq's d35a4e048 - sanify multiplying join prune
[dbsrgits/DBIx-Class-Historic.git] / lib / DBIx / Class / Storage / DBIHacks.pm
CommitLineData
c443438f 1package #hide from PAUSE
2 DBIx::Class::Storage::DBIHacks;
d28bb90d 3
4#
5# This module contains code that should never have seen the light of day,
6# does not belong in the Storage, or is otherwise unfit for public
6a6394f1 7# display. The arrival of SQLA2 should immediately obsolete 90% of this
d28bb90d 8#
9
10use strict;
11use warnings;
12
13use base 'DBIx::Class::Storage';
14use mro 'c3';
15
6298a324 16use List::Util 'first';
17use Scalar::Util 'blessed';
ea5c7509 18use Sub::Name 'subname';
6298a324 19use namespace::clean;
d28bb90d 20
21#
052e8431 22# This code will remove non-selecting/non-restricting joins from
4b1b5ea3 23# {from} specs, aiding the RDBMS query optimizer
052e8431 24#
25sub _prune_unused_joins {
ea95892e 26 my $self = shift;
437a9cfa 27 my ($from, $select, $where, $attrs) = @_;
052e8431 28
ea95892e 29 return $from unless $self->_use_join_optimizer;
30
052e8431 31 if (ref $from ne 'ARRAY' || ref $from->[0] ne 'HASH' || ref $from->[1] ne 'ARRAY') {
32 return $from; # only standard {from} specs are supported
33 }
34
4b1b5ea3 35 my $aliastypes = $self->_resolve_aliastypes_from_select_args(@_);
36
97e130fa 37 # don't care
38 delete $aliastypes->{joining};
39
4b1b5ea3 40 # a grouped set will not be affected by amount of rows. Thus any
41 # {multiplying} joins can go
97e130fa 42 delete $aliastypes->{multiplying}
437a9cfa 43 if $attrs->{_force_prune_multiplying_joins} or $attrs->{group_by};
4b1b5ea3 44
052e8431 45 my @newfrom = $from->[0]; # FROM head is always present
46
a4812caa 47 my %need_joins;
97e130fa 48
a4812caa 49 for (values %$aliastypes) {
50 # add all requested aliases
51 $need_joins{$_} = 1 for keys %$_;
52
53 # add all their parents (as per joinpath which is an AoH { table => alias })
97e130fa 54 $need_joins{$_} = 1 for map { values %$_ } map { @{$_->{-parents}} } values %$_;
a4812caa 55 }
97e130fa 56
052e8431 57 for my $j (@{$from}[1..$#$from]) {
539ffe87 58 push @newfrom, $j if (
4b1b5ea3 59 (! $j->[0]{-alias}) # legacy crap
539ffe87 60 ||
61 $need_joins{$j->[0]{-alias}}
62 );
052e8431 63 }
64
65 return \@newfrom;
66}
67
052e8431 68#
d28bb90d 69# This is the code producing joined subqueries like:
8273e845 70# SELECT me.*, other.* FROM ( SELECT me.* FROM ... ) JOIN other ON ...
d28bb90d 71#
72sub _adjust_select_args_for_complex_prefetch {
73 my ($self, $from, $select, $where, $attrs) = @_;
74
d28bb90d 75 $self->throw_exception ('Complex prefetches are not supported on resultsets with a custom from attribute')
76 if (ref $from ne 'ARRAY' || ref $from->[0] ne 'HASH' || ref $from->[1] ne 'ARRAY');
77
1e4f9fb3 78 my $root_alias = $attrs->{alias};
79
d28bb90d 80 # generate inner/outer attribute lists, remove stuff that doesn't apply
81 my $outer_attrs = { %$attrs };
1e4f9fb3 82 delete $outer_attrs->{$_} for qw/where bind rows offset group_by _grouped_by_distinct having/;
d28bb90d 83
186ba34c 84 my $inner_attrs = { %$attrs };
1e4f9fb3 85 delete $inner_attrs->{$_} for qw/from for collapse select as _related_results_construction/;
d28bb90d 86
4df1400e 87 # there is no point of ordering the insides if there is no limit
88 delete $inner_attrs->{order_by} if (
89 delete $inner_attrs->{_order_is_artificial}
90 or
91 ! $inner_attrs->{rows}
92 );
946f6260 93
d28bb90d 94 # generate the inner/outer select lists
95 # for inside we consider only stuff *not* brought in by the prefetch
96 # on the outside we substitute any function for its alias
97 my $outer_select = [ @$select ];
97e130fa 98 my $inner_select;
36fd7f07 99
97e130fa 100 my ($root_node, $root_node_offset);
27e0370d 101
102 for my $i (0 .. $#$from) {
103 my $node = $from->[$i];
104 my $h = (ref $node eq 'HASH') ? $node
105 : (ref $node eq 'ARRAY' and ref $node->[0] eq 'HASH') ? $node->[0]
106 : next
107 ;
108
1e4f9fb3 109 if ( ($h->{-alias}||'') eq $root_alias and $h->{-rsrc} ) {
97e130fa 110 $root_node = $h;
111 $root_node_offset = $i;
27e0370d 112 last;
113 }
114 }
115
116 $self->throw_exception ('Complex prefetches are not supported on resultsets with a custom from attribute')
97e130fa 117 unless $root_node;
27e0370d 118
119 # use the heavy duty resolver to take care of aliased/nonaliased naming
120 my $colinfo = $self->_resolve_column_info($from);
121 my $selected_root_columns;
122
1e4f9fb3 123 for my $i (0 .. $#$outer_select) {
d28bb90d 124 my $sel = $outer_select->[$i];
125
1e4f9fb3 126 next if (
127 $colinfo->{$sel} and $colinfo->{$sel}{-source_alias} ne $root_alias
128 );
129
d28bb90d 130 if (ref $sel eq 'HASH' ) {
131 $sel->{-as} ||= $attrs->{as}[$i];
1e4f9fb3 132 $outer_select->[$i] = join ('.', $root_alias, ($sel->{-as} || "inner_column_$i") );
d28bb90d 133 }
27e0370d 134 elsif (! ref $sel and my $ci = $colinfo->{$sel}) {
135 $selected_root_columns->{$ci->{-colname}} = 1;
136 }
d28bb90d 137
138 push @$inner_select, $sel;
bb9bffea 139
140 push @{$inner_attrs->{as}}, $attrs->{as}[$i];
d28bb90d 141 }
142
97e130fa 143 # We will need to fetch all native columns in the inner subquery, which may
144 # be a part of an *outer* join condition, or an order_by (which needs to be
145 # preserved outside)
146 # We can not just fetch everything because a potential has_many restricting
147 # join collapse *will not work* on heavy data types.
148 my $connecting_aliastypes = $self->_resolve_aliastypes_from_select_args(
149 [grep { ref($_) eq 'ARRAY' or ref($_) eq 'HASH' } @{$from}[$root_node_offset .. $#$from]],
150 [],
151 $where,
152 $inner_attrs
153 );
154
155 for (sort map { keys %{$_->{-seen_columns}||{}} } map { values %$_ } values %$connecting_aliastypes) {
156 my $ci = $colinfo->{$_} or next;
157 if (
1e4f9fb3 158 $ci->{-source_alias} eq $root_alias
97e130fa 159 and
160 ! $selected_root_columns->{$ci->{-colname}}++
161 ) {
162 # adding it to both to keep limits not supporting dark selectors happy
163 push @$inner_select, $ci->{-fq_colname};
164 push @{$inner_attrs->{as}}, $ci->{-fq_colname};
27e0370d 165 }
166 }
167
ea95892e 168 # construct the inner $from and lock it in a subquery
48580715 169 # we need to prune first, because this will determine if we need a group_by below
97e130fa 170 # throw away all non-selecting, non-restricting multijoins
171 # (since we def. do not care about multiplication those inside the subquery)
6395604e 172 my $inner_subq = do {
ea95892e 173
174 # must use it here regardless of user requests
175 local $self->{_use_join_optimizer} = 1;
176
97e130fa 177 # throw away multijoins since we def. do not care about those inside the subquery
437a9cfa 178 my $inner_from = $self->_prune_unused_joins ($from, $inner_select, $where, {
179 %$inner_attrs, _force_prune_multiplying_joins => 1
180 });
ea95892e 181
887a0aef 182 my $inner_aliastypes =
183 $self->_resolve_aliastypes_from_select_args( $inner_from, $inner_select, $where, $inner_attrs );
184
1e4f9fb3 185 # uh-oh a multiplier (which is not us) left in, this is a problem
0a3441ee 186 if (
1e4f9fb3 187 $inner_aliastypes->{multiplying}
188 and
189 !$inner_aliastypes->{grouping} # if there are groups - assume user knows wtf they are up to
0a3441ee 190 and
1e4f9fb3 191 my @multipliers = grep { $_ ne $root_alias } keys %{$inner_aliastypes->{multiplying}}
0a3441ee 192 ) {
1e4f9fb3 193
194 # if none of the multipliers came from an order_by (guaranteed to have been combined
195 # with a limit) - easy - just slap a group_by to simulate a collape and be on our way
196 if (
197 ! $inner_aliastypes->{ordering}
198 or
199 ! first { $inner_aliastypes->{ordering}{$_} } @multipliers
200 ) {
318e3d94 201
1e4f9fb3 202 my $unprocessed_order_chunks;
203 ($inner_attrs->{group_by}, $unprocessed_order_chunks) = $self->_group_over_selection (
204 $inner_from, $inner_select, $inner_attrs->{order_by}
205 );
206
207 $self->throw_exception (
208 'A required group_by clause could not be constructed automatically due to a complex '
209 . 'order_by criteria. Either order_by columns only (no functions) or construct a suitable '
210 . 'group_by by hand'
211 ) if $unprocessed_order_chunks;
212 }
213 else {
214 # We need to order by external columns and group at the same time
215 # so we can calculate the proper limit
216 # This doesn't really make sense in SQL, however from DBICs point
217 # of view is rather valid (order the leftmost objects by whatever
218 # criteria and get the offset/rows many). There is a way around
219 # this however in SQL - we simply tae the direction of each piece
220 # of the foreign order and convert them to MIN(X) for ASC or MAX(X)
221 # for DESC, and group_by the root columns. The end result should be
222 # exactly what we expect
223
224 # FIXME REMOVE LATER - (just a sanity check)
225 if (defined ( my $impostor = first
226 { $_ ne $root_alias }
227 keys %{ $inner_aliastypes->{selecting} }
228 ) ) {
229 $self->throw_exception(sprintf
230 'Unexpected inner selection during complex prefetch (%s)...',
231 join ', ', keys %{ $inner_aliastypes->{joining}{$impostor}{-seen_columns} || {} }
232 );
233 }
234
235 # supplement the main selection with pks if not already there,
236 # as they will have to be a part of the group_by to colapse
237 # things properly
238 my $cur_sel = { map { $_ => 1 } @$inner_select };
318e3d94 239
1e4f9fb3 240 my @pks = map { "$root_alias.$_" } $root_node->{-rsrc}->primary_columns
241 or $self->throw_exception( sprintf
242 'Unable to perform complex limited prefetch off %s without declared primary key',
243 $root_node->{-rsrc}->source_name,
244 );
245 for my $col (@pks) {
246 push @$inner_select, $col
247 unless $cur_sel->{$col}++;
248 }
249
250 # wrap any part of the order_by that "responds" to an ordering alias
251 # into a MIN/MAX
252 # FIXME - this code is a joke, will need to be completely rewritten in
253 # the DQ branch. But I need to push a POC here, otherwise the
254 # pesky tests won't pass
255 my $sql_maker = $self->sql_maker;
256 my ($lquote, $rquote, $sep) = map { quotemeta $_ } ($sql_maker->_quote_chars, $sql_maker->name_sep);
257 my $own_re = qr/ $lquote \Q$root_alias\E $rquote $sep | \b \Q$root_alias\E $sep /x;
e6977bbb 258 my @order_chunks = map { ref $_ eq 'ARRAY' ? $_ : [ $_ ] } $sql_maker->_order_by_chunks($attrs->{order_by});
259 my @new_order = map { \$_ } @order_chunks;
260 my $inner_columns_info = $self->_resolve_column_info($inner_from);
261
262 # loop through and replace stuff that is not "ours" with a min/max func
263 # everything is a literal at this point, since we are likely properly
264 # quoted and stuff
265 for my $i (0 .. $#new_order) {
266 my $chunk = $order_chunks[$i][0];
267
268 # skip ourselves
269 next if $chunk =~ $own_re;
270
cb3e87f5 271 ($chunk, my $is_desc) = $sql_maker->_split_order_chunk($chunk);
e6977bbb 272
273 # maybe our own unqualified column
318e3d94 274 my $ord_bit = (
275 $lquote and $sep and $chunk =~ /^ $lquote ([^$sep]+) $rquote $/x
276 ) ? $1 : $chunk;
277
e6977bbb 278 next if (
279 $ord_bit
280 and
281 $inner_columns_info->{$ord_bit}
282 and
283 $inner_columns_info->{$ord_bit}{-source_alias} eq $root_alias
284 );
285
286 $new_order[$i] = \[
1e4f9fb3 287 sprintf(
288 '%s(%s)%s',
289 ($is_desc ? 'MAX' : 'MIN'),
e6977bbb 290 $chunk,
1e4f9fb3 291 ($is_desc ? ' DESC' : ''),
292 ),
293 @ {$order_chunks[$i]} [ 1 .. $#{$order_chunks[$i]} ]
294 ];
295 }
296
e6977bbb 297 $inner_attrs->{order_by} = \@new_order;
298
299 # do not care about leftovers here - it will be all the functions
300 # we just created
1e4f9fb3 301 ($inner_attrs->{group_by}) = $self->_group_over_selection (
302 $inner_from, $inner_select, $inner_attrs->{order_by}
303 );
304 }
0a3441ee 305 }
d28bb90d 306
ea95892e 307 # we already optimized $inner_from above
97e130fa 308 # and already local()ized
309 $self->{_use_join_optimizer} = 0;
d28bb90d 310
ea95892e 311 # generate the subquery
6395604e 312 $self->_select_args_to_query (
ea95892e 313 $inner_from,
314 $inner_select,
315 $where,
316 $inner_attrs,
317 );
d28bb90d 318 };
319
320 # Generate the outer from - this is relatively easy (really just replace
321 # the join slot with the subquery), with a major caveat - we can not
322 # join anything that is non-selecting (not part of the prefetch), but at
323 # the same time is a multi-type relationship, as it will explode the result.
324 #
325 # There are two possibilities here
326 # - either the join is non-restricting, in which case we simply throw it away
327 # - it is part of the restrictions, in which case we need to collapse the outer
328 # result by tackling yet another group_by to the outside of the query
329
27e0370d 330 # work on a shallow copy
052e8431 331 $from = [ @$from ];
052e8431 332
d28bb90d 333 my @outer_from;
53c29913 334
27e0370d 335 # we may not be the head
97e130fa 336 if ($root_node_offset) {
27e0370d 337 # first generate the outer_from, up to the substitution point
97e130fa 338 @outer_from = splice @$from, 0, $root_node_offset;
27e0370d 339
340 push @outer_from, [
341 {
1e4f9fb3 342 -alias => $root_alias,
97e130fa 343 -rsrc => $root_node->{-rsrc},
1e4f9fb3 344 $root_alias => $inner_subq,
27e0370d 345 },
97e130fa 346 @{$from->[0]}[1 .. $#{$from->[0]}],
27e0370d 347 ];
348 }
349 else {
27e0370d 350 @outer_from = {
1e4f9fb3 351 -alias => $root_alias,
27e0370d 352 -rsrc => $root_node->{-rsrc},
1e4f9fb3 353 $root_alias => $inner_subq,
27e0370d 354 };
d28bb90d 355 }
356
97e130fa 357 shift @$from; # it's replaced in @outer_from already
358
ea95892e 359 # scan the *remaining* from spec against different attributes, and see which joins are needed
052e8431 360 # in what role
361 my $outer_aliastypes =
539ffe87 362 $self->_resolve_aliastypes_from_select_args( $from, $outer_select, $where, $outer_attrs );
052e8431 363
a4812caa 364 # unroll parents
1e4f9fb3 365 my ($outer_select_chain, @outer_nonselecting_chains) = map { +{
366 map { $_ => 1 } map { values %$_} map { @{$_->{-parents}} } values %{ $outer_aliastypes->{$_} || {} }
367 } } qw/selecting restricting grouping ordering/;
a4812caa 368
d28bb90d 369 # see what's left - throw away if not selecting/restricting
a4812caa 370 # also throw in a group_by if a non-selecting multiplier,
371 # to guard against cross-join explosions
36fd7f07 372 my $need_outer_group_by;
d28bb90d 373 while (my $j = shift @$from) {
374 my $alias = $j->[0]{-alias};
375
a4812caa 376 if (
377 $outer_select_chain->{$alias}
378 ) {
379 push @outer_from, $j
d28bb90d 380 }
1e4f9fb3 381 elsif (first { $_->{$alias} } @outer_nonselecting_chains ) {
d28bb90d 382 push @outer_from, $j;
a4812caa 383 $need_outer_group_by ||= $outer_aliastypes->{multiplying}{$alias} ? 1 : 0;
d28bb90d 384 }
385 }
386
1e4f9fb3 387 if ( $need_outer_group_by and $attrs->{_grouped_by_distinct} ) {
36fd7f07 388 my $unprocessed_order_chunks;
389 ($outer_attrs->{group_by}, $unprocessed_order_chunks) = $self->_group_over_selection (
390 \@outer_from, $outer_select, $outer_attrs->{order_by}
391 );
392
393 $self->throw_exception (
394 'A required group_by clause could not be constructed automatically due to a complex '
395 . 'order_by criteria. Either order_by columns only (no functions) or construct a suitable '
396 . 'group_by by hand'
397 ) if $unprocessed_order_chunks;
398
399 }
400
d28bb90d 401 # This is totally horrific - the $where ends up in both the inner and outer query
402 # Unfortunately not much can be done until SQLA2 introspection arrives, and even
403 # then if where conditions apply to the *right* side of the prefetch, you may have
404 # to both filter the inner select (e.g. to apply a limit) and then have to re-filter
405 # the outer select to exclude joins you didin't want in the first place
406 #
407 # OTOH it can be seen as a plus: <ash> (notes that this query would make a DBA cry ;)
408 return (\@outer_from, $outer_select, $where, $outer_attrs);
409}
410
1a736efb 411#
412# I KNOW THIS SUCKS! GET SQLA2 OUT THE DOOR SO THIS CAN DIE!
413#
ad630f4b 414# Due to a lack of SQLA2 we fall back to crude scans of all the
415# select/where/order/group attributes, in order to determine what
416# aliases are neded to fulfill the query. This information is used
417# throughout the code to prune unnecessary JOINs from the queries
418# in an attempt to reduce the execution time.
419# Although the method is pretty horrific, the worst thing that can
1a736efb 420# happen is for it to fail due to some scalar SQL, which in turn will
421# result in a vocal exception.
539ffe87 422sub _resolve_aliastypes_from_select_args {
052e8431 423 my ( $self, $from, $select, $where, $attrs ) = @_;
546f1cd9 424
ad630f4b 425 $self->throw_exception ('Unable to analyze custom {from}')
426 if ref $from ne 'ARRAY';
546f1cd9 427
ad630f4b 428 # what we will return
964a3c71 429 my $aliases_by_type;
546f1cd9 430
ad630f4b 431 # see what aliases are there to work with
432 my $alias_list;
539ffe87 433 for (@$from) {
434 my $j = $_;
ad630f4b 435 $j = $j->[0] if ref $j eq 'ARRAY';
539ffe87 436 my $al = $j->{-alias}
437 or next;
438
439 $alias_list->{$al} = $j;
97e130fa 440 $aliases_by_type->{multiplying}{$al} ||= { -parents => $j->{-join_path}||[] } if (
a4812caa 441 # not array == {from} head == can't be multiplying
442 ( ref($_) eq 'ARRAY' and ! $j->{-is_single} )
443 or
444 # a parent of ours is already a multiplier
445 ( grep { $aliases_by_type->{multiplying}{$_} } @{ $j->{-join_path}||[] } )
446 );
546f1cd9 447 }
546f1cd9 448
318e3d94 449 # get a column to source/alias map (including unambiguous unqualified ones)
1a736efb 450 my $colinfo = $self->_resolve_column_info ($from);
451
ad630f4b 452 # set up a botched SQLA
453 my $sql_maker = $self->sql_maker;
07f31d19 454
4c2b30d6 455 # these are throw away results, do not pollute the bind stack
4c2b30d6 456 local $sql_maker->{select_bind};
0542ec57 457 local $sql_maker->{where_bind};
458 local $sql_maker->{group_bind};
459 local $sql_maker->{having_bind};
97e130fa 460 local $sql_maker->{from_bind};
3f5b99fe 461
462 # we can't scan properly without any quoting (\b doesn't cut it
463 # everywhere), so unless there is proper quoting set - use our
464 # own weird impossible character.
465 # Also in the case of no quoting, we need to explicitly disable
466 # name_sep, otherwise sorry nasty legacy syntax like
467 # { 'count(foo.id)' => { '>' => 3 } } will stop working >:(
468 local $sql_maker->{quote_char} = $sql_maker->{quote_char};
469 local $sql_maker->{name_sep} = $sql_maker->{name_sep};
470
471 unless (defined $sql_maker->{quote_char} and length $sql_maker->{quote_char}) {
e493ecb2 472 $sql_maker->{quote_char} = ["\x00", "\xFF"];
473 # if we don't unset it we screw up retarded but unfortunately working
474 # 'MAX(foo.bar)' => { '>', 3 }
3f5b99fe 475 $sql_maker->{name_sep} = '';
476 }
477
478 my ($lquote, $rquote, $sep) = map { quotemeta $_ } ($sql_maker->_quote_chars, $sql_maker->name_sep);
07f31d19 479
1a736efb 480 # generate sql chunks
481 my $to_scan = {
482 restricting => [
483 $sql_maker->_recurse_where ($where),
1e4f9fb3 484 $sql_maker->_parse_rs_attrs ({ having => $attrs->{having} }),
485 ],
486 grouping => [
487 $sql_maker->_parse_rs_attrs ({ group_by => $attrs->{group_by} }),
1a736efb 488 ],
97e130fa 489 joining => [
490 $sql_maker->_recurse_from (
491 ref $from->[0] eq 'ARRAY' ? $from->[0][0] : $from->[0],
492 @{$from}[1 .. $#$from],
493 ),
494 ],
1a736efb 495 selecting => [
1a736efb 496 $sql_maker->_recurse_fields ($select),
1e4f9fb3 497 ],
498 ordering => [
499 map { $_->[0] } $self->_extract_order_criteria ($attrs->{order_by}, $sql_maker),
1a736efb 500 ],
501 };
07f31d19 502
1a736efb 503 # throw away empty chunks
504 $_ = [ map { $_ || () } @$_ ] for values %$to_scan;
07f31d19 505
318e3d94 506 # first see if we have any exact matches (qualified or unqualified)
507 for my $type (keys %$to_scan) {
508 for my $piece (@{$to_scan->{$type}}) {
509 if ($colinfo->{$piece} and my $alias = $colinfo->{$piece}{-source_alias}) {
510 $aliases_by_type->{$type}{$alias} ||= { -parents => $alias_list->{$alias}{-join_path}||[] };
511 $aliases_by_type->{$type}{$alias}{-seen_columns}{$colinfo->{$piece}{-fq_colname}} = $piece;
512 }
513 }
514 }
515
516 # now loop through all fully qualified columns and get the corresponding
1a736efb 517 # alias (should work even if they are in scalarrefs)
ad630f4b 518 for my $alias (keys %$alias_list) {
1a736efb 519 my $al_re = qr/
97e130fa 520 $lquote $alias $rquote $sep (?: $lquote ([^$rquote]+) $rquote )?
1a736efb 521 |
97e130fa 522 \b $alias \. ([^\s\)\($rquote]+)?
1a736efb 523 /x;
524
1a736efb 525 for my $type (keys %$to_scan) {
526 for my $piece (@{$to_scan->{$type}}) {
97e130fa 527 if (my @matches = $piece =~ /$al_re/g) {
528 $aliases_by_type->{$type}{$alias} ||= { -parents => $alias_list->{$alias}{-join_path}||[] };
1e4f9fb3 529 $aliases_by_type->{$type}{$alias}{-seen_columns}{"$alias.$_"} = "$alias.$_"
97e130fa 530 for grep { defined $_ } @matches;
531 }
1a736efb 532 }
ad630f4b 533 }
1a736efb 534 }
535
536 # now loop through unqualified column names, and try to locate them within
537 # the chunks
538 for my $col (keys %$colinfo) {
3f5b99fe 539 next if $col =~ / \. /x; # if column is qualified it was caught by the above
1a736efb 540
97e130fa 541 my $col_re = qr/ $lquote ($col) $rquote /x;
07f31d19 542
1a736efb 543 for my $type (keys %$to_scan) {
544 for my $piece (@{$to_scan->{$type}}) {
318e3d94 545 if ( my @matches = $piece =~ /$col_re/g) {
a4812caa 546 my $alias = $colinfo->{$col}{-source_alias};
97e130fa 547 $aliases_by_type->{$type}{$alias} ||= { -parents => $alias_list->{$alias}{-join_path}||[] };
1e4f9fb3 548 $aliases_by_type->{$type}{$alias}{-seen_columns}{"$alias.$_"} = $_
97e130fa 549 for grep { defined $_ } @matches;
a4812caa 550 }
1a736efb 551 }
07f31d19 552 }
553 }
554
555 # Add any non-left joins to the restriction list (such joins are indeed restrictions)
ad630f4b 556 for my $j (values %$alias_list) {
07f31d19 557 my $alias = $j->{-alias} or next;
97e130fa 558 $aliases_by_type->{restricting}{$alias} ||= { -parents => $j->{-join_path}||[] } if (
07f31d19 559 (not $j->{-join_type})
560 or
561 ($j->{-join_type} !~ /^left (?: \s+ outer)? $/xi)
562 );
563 }
564
1e4f9fb3 565 for (keys %$aliases_by_type) {
566 delete $aliases_by_type->{$_} unless keys %{$aliases_by_type->{$_}};
567 }
568
964a3c71 569 return $aliases_by_type;
07f31d19 570}
571
bac358c9 572# This is the engine behind { distinct => 1 }
0a3441ee 573sub _group_over_selection {
574 my ($self, $from, $select, $order_by) = @_;
575
576 my $rs_column_list = $self->_resolve_column_info ($from);
577
578 my (@group_by, %group_index);
579
36fd7f07 580 # the logic is: if it is a { func => val } we assume an aggregate,
581 # otherwise if \'...' or \[...] we assume the user knows what is
582 # going on thus group over it
0a3441ee 583 for (@$select) {
584 if (! ref($_) or ref ($_) ne 'HASH' ) {
585 push @group_by, $_;
586 $group_index{$_}++;
587 if ($rs_column_list->{$_} and $_ !~ /\./ ) {
588 # add a fully qualified version as well
589 $group_index{"$rs_column_list->{$_}{-source_alias}.$_"}++;
590 }
07f31d19 591 }
592 }
ad630f4b 593
0a3441ee 594 # add any order_by parts that are not already present in the group_by
595 # we need to be careful not to add any named functions/aggregates
bac358c9 596 # i.e. order_by => [ ... { count => 'foo' } ... ]
14e26c5f 597 my @leftovers;
bac358c9 598 for ($self->_extract_order_criteria($order_by)) {
0a3441ee 599 # only consider real columns (for functions the user got to do an explicit group_by)
14e26c5f 600 if (@$_ != 1) {
601 push @leftovers, $_;
602 next;
603 }
bac358c9 604 my $chunk = $_->[0];
14e26c5f 605 my $colinfo = $rs_column_list->{$chunk} or do {
606 push @leftovers, $_;
607 next;
608 };
0a3441ee 609
610 $chunk = "$colinfo->{-source_alias}.$chunk" if $chunk !~ /\./;
611 push @group_by, $chunk unless $group_index{$chunk}++;
612 }
613
14e26c5f 614 return wantarray
615 ? (\@group_by, (@leftovers ? \@leftovers : undef) )
616 : \@group_by
617 ;
07f31d19 618}
619
d28bb90d 620sub _resolve_ident_sources {
621 my ($self, $ident) = @_;
622
623 my $alias2source = {};
624 my $rs_alias;
625
626 # the reason this is so contrived is that $ident may be a {from}
627 # structure, specifying multiple tables to join
6298a324 628 if ( blessed $ident && $ident->isa("DBIx::Class::ResultSource") ) {
d28bb90d 629 # this is compat mode for insert/update/delete which do not deal with aliases
630 $alias2source->{me} = $ident;
631 $rs_alias = 'me';
632 }
633 elsif (ref $ident eq 'ARRAY') {
634
635 for (@$ident) {
636 my $tabinfo;
637 if (ref $_ eq 'HASH') {
638 $tabinfo = $_;
639 $rs_alias = $tabinfo->{-alias};
640 }
641 if (ref $_ eq 'ARRAY' and ref $_->[0] eq 'HASH') {
642 $tabinfo = $_->[0];
643 }
644
4376a157 645 $alias2source->{$tabinfo->{-alias}} = $tabinfo->{-rsrc}
646 if ($tabinfo->{-rsrc});
d28bb90d 647 }
648 }
649
650 return ($alias2source, $rs_alias);
651}
652
653# Takes $ident, \@column_names
654#
655# returns { $column_name => \%column_info, ... }
656# also note: this adds -result_source => $rsrc to the column info
657#
09e14fdc 658# If no columns_names are supplied returns info about *all* columns
659# for all sources
d28bb90d 660sub _resolve_column_info {
661 my ($self, $ident, $colnames) = @_;
662 my ($alias2src, $root_alias) = $self->_resolve_ident_sources($ident);
663
52416317 664 my (%seen_cols, @auto_colnames);
d28bb90d 665
666 # compile a global list of column names, to be able to properly
667 # disambiguate unqualified column names (if at all possible)
668 for my $alias (keys %$alias2src) {
669 my $rsrc = $alias2src->{$alias};
670 for my $colname ($rsrc->columns) {
671 push @{$seen_cols{$colname}}, $alias;
3f5b99fe 672 push @auto_colnames, "$alias.$colname" unless $colnames;
d28bb90d 673 }
674 }
675
09e14fdc 676 $colnames ||= [
677 @auto_colnames,
678 grep { @{$seen_cols{$_}} == 1 } (keys %seen_cols),
679 ];
680
52416317 681 my (%return, $colinfos);
d28bb90d 682 foreach my $col (@$colnames) {
52416317 683 my ($source_alias, $colname) = $col =~ m/^ (?: ([^\.]+) \. )? (.+) $/x;
d28bb90d 684
52416317 685 # if the column was seen exactly once - we know which rsrc it came from
686 $source_alias ||= $seen_cols{$colname}[0]
687 if ($seen_cols{$colname} and @{$seen_cols{$colname}} == 1);
d28bb90d 688
52416317 689 next unless $source_alias;
690
691 my $rsrc = $alias2src->{$source_alias}
692 or next;
693
694 $return{$col} = {
6395604e 695 %{
696 ( $colinfos->{$source_alias} ||= $rsrc->columns_info )->{$colname}
697 ||
698 $self->throw_exception(
699 "No such column '$colname' on source " . $rsrc->source_name
700 );
701 },
d28bb90d 702 -result_source => $rsrc,
52416317 703 -source_alias => $source_alias,
81bf295c 704 -fq_colname => $col eq $colname ? "$source_alias.$col" : $col,
705 -colname => $colname,
d28bb90d 706 };
81bf295c 707
708 $return{"$source_alias.$colname"} = $return{$col} if $col eq $colname;
d28bb90d 709 }
710
711 return \%return;
712}
713
289ac713 714# The DBIC relationship chaining implementation is pretty simple - every
715# new related_relationship is pushed onto the {from} stack, and the {select}
716# window simply slides further in. This means that when we count somewhere
717# in the middle, we got to make sure that everything in the join chain is an
718# actual inner join, otherwise the count will come back with unpredictable
719# results (a resultset may be generated with _some_ rows regardless of if
720# the relation which the $rs currently selects has rows or not). E.g.
721# $artist_rs->cds->count - normally generates:
722# SELECT COUNT( * ) FROM artist me LEFT JOIN cd cds ON cds.artist = me.artistid
723# which actually returns the number of artists * (number of cds || 1)
724#
725# So what we do here is crawl {from}, determine if the current alias is at
726# the top of the stack, and if not - make sure the chain is inner-joined down
727# to the root.
728#
31a8aaaf 729sub _inner_join_to_node {
289ac713 730 my ($self, $from, $alias) = @_;
731
732 # subqueries and other oddness are naturally not supported
733 return $from if (
734 ref $from ne 'ARRAY'
735 ||
736 @$from <= 1
737 ||
738 ref $from->[0] ne 'HASH'
739 ||
740 ! $from->[0]{-alias}
741 ||
7eb76996 742 $from->[0]{-alias} eq $alias # this last bit means $alias is the head of $from - nothing to do
289ac713 743 );
744
745 # find the current $alias in the $from structure
746 my $switch_branch;
747 JOINSCAN:
748 for my $j (@{$from}[1 .. $#$from]) {
749 if ($j->[0]{-alias} eq $alias) {
750 $switch_branch = $j->[0]{-join_path};
751 last JOINSCAN;
752 }
753 }
754
7eb76996 755 # something else went quite wrong
289ac713 756 return $from unless $switch_branch;
757
758 # So it looks like we will have to switch some stuff around.
759 # local() is useless here as we will be leaving the scope
760 # anyway, and deep cloning is just too fucking expensive
8273e845 761 # So replace the first hashref in the node arrayref manually
289ac713 762 my @new_from = ($from->[0]);
faeb2407 763 my $sw_idx = { map { (values %$_), 1 } @$switch_branch }; #there's one k/v per join-path
289ac713 764
765 for my $j (@{$from}[1 .. $#$from]) {
766 my $jalias = $j->[0]{-alias};
767
768 if ($sw_idx->{$jalias}) {
769 my %attrs = %{$j->[0]};
770 delete $attrs{-join_type};
771 push @new_from, [
772 \%attrs,
773 @{$j}[ 1 .. $#$j ],
774 ];
775 }
776 else {
777 push @new_from, $j;
778 }
779 }
780
781 return \@new_from;
782}
783
bac358c9 784sub _extract_order_criteria {
1a736efb 785 my ($self, $order_by, $sql_maker) = @_;
c0748280 786
1a736efb 787 my $parser = sub {
e6977bbb 788 my ($sql_maker, $order_by, $orig_quote_chars) = @_;
c0748280 789
1a736efb 790 return scalar $sql_maker->_order_by_chunks ($order_by)
791 unless wantarray;
c0748280 792
e6977bbb 793 my ($lq, $rq, $sep) = map { quotemeta($_) } (
794 ($orig_quote_chars ? @$orig_quote_chars : $sql_maker->_quote_chars),
795 $sql_maker->name_sep
796 );
797
1a736efb 798 my @chunks;
bac358c9 799 for ($sql_maker->_order_by_chunks ($order_by) ) {
e6977bbb 800 my $chunk = ref $_ ? [ @$_ ] : [ $_ ];
cb3e87f5 801 ($chunk->[0]) = $sql_maker->_split_order_chunk($chunk->[0]);
e6977bbb 802
803 # order criteria may have come back pre-quoted (literals and whatnot)
804 # this is fragile, but the best we can currently do
805 $chunk->[0] =~ s/^ $lq (.+?) $rq $sep $lq (.+?) $rq $/"$1.$2"/xe
806 or $chunk->[0] =~ s/^ $lq (.+) $rq $/$1/x;
807
1a736efb 808 push @chunks, $chunk;
bac6c4fb 809 }
1a736efb 810
811 return @chunks;
812 };
813
814 if ($sql_maker) {
815 return $parser->($sql_maker, $order_by);
bac6c4fb 816 }
817 else {
1a736efb 818 $sql_maker = $self->sql_maker;
e6977bbb 819
820 # pass these in to deal with literals coming from
821 # the user or the deep guts of prefetch
822 my $orig_quote_chars = [$sql_maker->_quote_chars];
823
1a736efb 824 local $sql_maker->{quote_char};
e6977bbb 825 return $parser->($sql_maker, $order_by, $orig_quote_chars);
bac6c4fb 826 }
bac6c4fb 827}
828
7cec4356 829sub _order_by_is_stable {
5f11e54f 830 my ($self, $ident, $order_by, $where) = @_;
c0748280 831
5f11e54f 832 my $colinfo = $self->_resolve_column_info($ident, [
833 (map { $_->[0] } $self->_extract_order_criteria($order_by)),
834 $where ? @{$self->_extract_fixed_condition_columns($where)} :(),
835 ]);
c0748280 836
7cec4356 837 return undef unless keys %$colinfo;
838
839 my $cols_per_src;
840 $cols_per_src->{$_->{-source_alias}}{$_->{-colname}} = $_ for values %$colinfo;
841
842 for (values %$cols_per_src) {
843 my $src = (values %$_)[0]->{-result_source};
844 return 1 if $src->_identifying_column_set($_);
c0748280 845 }
846
7cec4356 847 return undef;
848}
849
0e81e691 850# this is almost identical to the above, except it accepts only
851# a single rsrc, and will succeed only if the first portion of the order
852# by is stable.
853# returns that portion as a colinfo hashref on success
854sub _main_source_order_by_portion_is_stable {
855 my ($self, $main_rsrc, $order_by, $where) = @_;
856
857 die "Huh... I expect a blessed result_source..."
858 if ref($main_rsrc) eq 'ARRAY';
859
860 my @ord_cols = map
861 { $_->[0] }
862 ( $self->_extract_order_criteria($order_by) )
863 ;
864 return unless @ord_cols;
865
318e3d94 866 my $colinfos = $self->_resolve_column_info($main_rsrc);
867
0e81e691 868 for (0 .. $#ord_cols) {
869 if (
870 ! $colinfos->{$ord_cols[$_]}
871 or
872 $colinfos->{$ord_cols[$_]}{-result_source} != $main_rsrc
873 ) {
874 $#ord_cols = $_ - 1;
875 last;
876 }
877 }
878
879 # we just truncated it above
880 return unless @ord_cols;
881
0e81e691 882 my $order_portion_ci = { map {
883 $colinfos->{$_}{-colname} => $colinfos->{$_},
884 $colinfos->{$_}{-fq_colname} => $colinfos->{$_},
885 } @ord_cols };
886
318e3d94 887 # since all we check here are the start of the order_by belonging to the
888 # top level $rsrc, a present identifying set will mean that the resultset
889 # is ordered by its leftmost table in a stable manner
890 #
891 # RV of _identifying_column_set contains unqualified names only
892 my $unqualified_idset = $main_rsrc->_identifying_column_set({
893 ( $where ? %{
894 $self->_resolve_column_info(
895 $main_rsrc, $self->_extract_fixed_condition_columns($where)
896 )
897 } : () ),
898 %$order_portion_ci
899 }) or return;
900
901 my $ret_info;
902 my %unqualified_idcols_from_order = map {
903 $order_portion_ci->{$_} ? ( $_ => $order_portion_ci->{$_} ) : ()
904 } @$unqualified_idset;
905
906 # extra optimization - cut the order_by at the end of the identifying set
907 # (just in case the user was stupid and overlooked the obvious)
908 for my $i (0 .. $#ord_cols) {
909 my $col = $ord_cols[$i];
910 my $unqualified_colname = $order_portion_ci->{$col}{-colname};
911 $ret_info->{$col} = { %{$order_portion_ci->{$col}}, -idx_in_order_subset => $i };
912 delete $unqualified_idcols_from_order{$ret_info->{$col}{-colname}};
913
914 # we didn't reach the end of the identifying portion yet
915 return $ret_info unless keys %unqualified_idcols_from_order;
916 }
0e81e691 917
318e3d94 918 die 'How did we get here...';
0e81e691 919}
920
5f11e54f 921# returns an arrayref of column names which *definitely* have som
922# sort of non-nullable equality requested in the given condition
923# specification. This is used to figure out if a resultset is
924# constrained to a column which is part of a unique constraint,
925# which in turn allows us to better predict how ordering will behave
926# etc.
927#
928# this is a rudimentary, incomplete, and error-prone extractor
929# however this is OK - it is conservative, and if we can not find
930# something that is in fact there - the stack will recover gracefully
931# Also - DQ and the mst it rode in on will save us all RSN!!!
932sub _extract_fixed_condition_columns {
933 my ($self, $where, $nested) = @_;
934
935 return unless ref $where eq 'HASH';
936
937 my @cols;
938 for my $lhs (keys %$where) {
939 if ($lhs =~ /^\-and$/i) {
940 push @cols, ref $where->{$lhs} eq 'ARRAY'
941 ? ( map { $self->_extract_fixed_condition_columns($_, 1) } @{$where->{$lhs}} )
942 : $self->_extract_fixed_condition_columns($where->{$lhs}, 1)
943 ;
944 }
945 elsif ($lhs !~ /^\-/) {
946 my $val = $where->{$lhs};
947
948 push @cols, $lhs if (defined $val and (
949 ! ref $val
950 or
951 (ref $val eq 'HASH' and keys %$val == 1 and defined $val->{'='})
952 ));
953 }
954 }
955 return $nested ? @cols : \@cols;
c0748280 956}
bac6c4fb 957
d28bb90d 9581;