switch _resolve_aliastypes_from_select_args to calling slightly saner methods
[dbsrgits/DBIx-Class.git] / lib / DBIx / Class / Storage / DBIHacks.pm
CommitLineData
c443438f 1package #hide from PAUSE
2 DBIx::Class::Storage::DBIHacks;
d28bb90d 3
4#
5# This module contains code that should never have seen the light of day,
6# does not belong in the Storage, or is otherwise unfit for public
6a6394f1 7# display. The arrival of SQLA2 should immediately obsolete 90% of this
d28bb90d 8#
9
10use strict;
11use warnings;
12
13use base 'DBIx::Class::Storage';
14use mro 'c3';
15
6298a324 16use List::Util 'first';
17use Scalar::Util 'blessed';
ea5c7509 18use Sub::Name 'subname';
10cef607 19use Data::Query::ExprHelpers;
6298a324 20use namespace::clean;
d28bb90d 21
#
# Removes non-selecting/non-restricting joins from a {from} spec, aiding
# the RDBMS query optimizer.
#
# Arguments: ($from, $select, $where, $attrs) - handed over unchanged to
# _resolve_aliastypes_from_select_args.
#
# Returns $from as-is when the join optimizer is switched off or when
# $from is not a standard [ \%head, \@join, ... ] structure. Otherwise
# returns the list ( \@pruned_from, \%aliastypes ), where %aliastypes is
# the resolver result with {joining} limited to the surviving aliases and
# {multiplying} limited to the surviving multipliers (unless the resolver
# result still carries its own {multiplying}, which then takes precedence).
#
sub _prune_unused_joins {
  my $self = shift;
  my ($from, $select, $where, $attrs) = @_;

  return $from unless $self->_use_join_optimizer;

  # only standard {from} specs are supported
  return $from unless (
    ref($from) eq 'ARRAY'
      and
    ref($from->[0]) eq 'HASH'
      and
    ref($from->[1]) eq 'ARRAY'
  );

  my $aliastypes = $self->_resolve_aliastypes_from_select_args(@_);

  # set these aside - they are re-added (filtered) to the return value
  my $orig_joins = delete $aliastypes->{joining};
  my $orig_multiplying = $aliastypes->{multiplying};

  # a grouped set will not be affected by amount of rows. Thus any
  # {multiplying} joins can go
  if ( $attrs->{_force_prune_multiplying_joins} or $attrs->{group_by} ) {
    delete $aliastypes->{multiplying};
  }

  # every requested alias is needed, and so is every parent on its
  # join path (the join path is an AoH { table => alias })
  my %need_joins;
  for my $by_alias (values %$aliastypes) {
    my @wanted = (
      ( keys %$by_alias ),
      ( map { values %$_ } map { @{$_->{-parents}} } values %$by_alias ),
    );
    $need_joins{$_} = 1 for @wanted;
  }

  # the FROM head is always present
  my @newfrom = ( $from->[0] );

  for my $join ( @{$from}[1 .. $#$from] ) {
    # a join without an alias is a legacy construct - always retained
    if ( ! defined $join->[0]{-alias} or $need_joins{$join->[0]{-alias}} ) {
      push @newfrom, $join;
    }
  }

  my %kept_multiplying = map
    { $need_joins{$_} ? ($_ => $orig_multiplying->{$_}) : () }
    keys %$orig_multiplying
  ;

  my %kept_joining = map { $_ => $orig_joins->{$_} } keys %need_joins;

  return ( \@newfrom, {
    multiplying => \%kept_multiplying,
    %$aliastypes,
    joining => \%kept_joining,
  } );
}
72
052e8431 73#
d28bb90d 74# This is the code producing joined subqueries like:
8273e845 75# SELECT me.*, other.* FROM ( SELECT me.* FROM ... ) JOIN other ON ...
d28bb90d 76#
# Rewrites the select arguments so that the root source is selected inside
# a subquery, with the remaining (still needed) joins attached on the outside.
#
# Arguments: ($from, $select, $where, $attrs); $attrs->{alias} names the root.
#
# Throws when $from is not a standard [ \%head, \@join, ... ] spec, or when
# no node in it carries both the root alias and an -rsrc.
#
# Returns the list ( \@outer_from, $outer_select, $where, $outer_attrs ).
# Note that the same $where is used for the inner subquery and returned for
# the outer query.
77sub _adjust_select_args_for_complex_prefetch {
78 my ($self, $from, $select, $where, $attrs) = @_;
79
d28bb90d 80 $self->throw_exception ('Complex prefetches are not supported on resultsets with a custom from attribute')
81 if (ref $from ne 'ARRAY' || ref $from->[0] ne 'HASH' || ref $from->[1] ne 'ARRAY');
82
1e4f9fb3 83 my $root_alias = $attrs->{alias};
84
d28bb90d 85 # generate inner/outer attribute lists, remove stuff that doesn't apply
86 my $outer_attrs = { %$attrs };
5b309063 87 delete @{$outer_attrs}{qw(where bind rows offset group_by _grouped_by_distinct having)};
d28bb90d 88
186ba34c 89 my $inner_attrs = { %$attrs };
5b309063 90 delete @{$inner_attrs}{qw(from for collapse select as _related_results_construction)};
d28bb90d 91
4df1400e 92 # there is no point of ordering the insides if there is no limit
93 delete $inner_attrs->{order_by} if (
94 delete $inner_attrs->{_order_is_artificial}
95 or
96 ! $inner_attrs->{rows}
97 );
946f6260 98
d28bb90d 99 # generate the inner/outer select lists
100 # for inside we consider only stuff *not* brought in by the prefetch
101 # on the outside we substitute any function for its alias
102 my $outer_select = [ @$select ];
97e130fa 103 my $inner_select;
36fd7f07 104
97e130fa 105 my ($root_node, $root_node_offset);
27e0370d 106
# locate the {from} node that carries the root alias (and an -rsrc),
# remembering its position within $from
107 for my $i (0 .. $#$from) {
108 my $node = $from->[$i];
109 my $h = (ref $node eq 'HASH') ? $node
110 : (ref $node eq 'ARRAY' and ref $node->[0] eq 'HASH') ? $node->[0]
111 : next
112 ;
113
1e4f9fb3 114 if ( ($h->{-alias}||'') eq $root_alias and $h->{-rsrc} ) {
97e130fa 115 $root_node = $h;
116 $root_node_offset = $i;
27e0370d 117 last;
118 }
119 }
120
121 $self->throw_exception ('Complex prefetches are not supported on resultsets with a custom from attribute')
97e130fa 122 unless $root_node;
27e0370d 123
124 # use the heavy duty resolver to take care of aliased/nonaliased naming
125 my $colinfo = $self->_resolve_column_info($from);
126 my $selected_root_columns;
127
1e4f9fb3 128 for my $i (0 .. $#$outer_select) {
d28bb90d 129 my $sel = $outer_select->[$i];
130
# a known column of a non-root source stays on the outside only
1e4f9fb3 131 next if (
132 $colinfo->{$sel} and $colinfo->{$sel}{-source_alias} ne $root_alias
133 );
134
# { func => ... } selectors are evaluated inside; the outside refers to them
# by "$root_alias.$as" (falling back to a generated inner_column_$i name)
d28bb90d 135 if (ref $sel eq 'HASH' ) {
136 $sel->{-as} ||= $attrs->{as}[$i];
1e4f9fb3 137 $outer_select->[$i] = join ('.', $root_alias, ($sel->{-as} || "inner_column_$i") );
d28bb90d 138 }
27e0370d 139 elsif (! ref $sel and my $ci = $colinfo->{$sel}) {
140 $selected_root_columns->{$ci->{-colname}} = 1;
141 }
d28bb90d 142
143 push @$inner_select, $sel;
bb9bffea 144
145 push @{$inner_attrs->{as}}, $attrs->{as}[$i];
d28bb90d 146 }
147
97e130fa 148 # We will need to fetch all native columns in the inner subquery, which may
149 # be a part of an *outer* join condition, or an order_by (which needs to be
150 # preserved outside)
151 # We can not just fetch everything because a potential has_many restricting
152 # join collapse *will not work* on heavy data types.
153 my $connecting_aliastypes = $self->_resolve_aliastypes_from_select_args(
560978e2 154 $from,
97e130fa 155 [],
156 $where,
157 $inner_attrs
158 );
159
160 for (sort map { keys %{$_->{-seen_columns}||{}} } map { values %$_ } values %$connecting_aliastypes) {
161 my $ci = $colinfo->{$_} or next;
162 if (
1e4f9fb3 163 $ci->{-source_alias} eq $root_alias
97e130fa 164 and
165 ! $selected_root_columns->{$ci->{-colname}}++
166 ) {
167 # adding it to both to keep limits not supporting dark selectors happy
168 push @$inner_select, $ci->{-fq_colname};
169 push @{$inner_attrs->{as}}, $ci->{-fq_colname};
27e0370d 170 }
171 }
172
ea95892e 173 # construct the inner $from and lock it in a subquery
48580715 174 # we need to prune first, because this will determine if we need a group_by below
97e130fa 175 # throw away all non-selecting, non-restricting multijoins
176 # (since we def. do not care about multiplication those inside the subquery)
6395604e 177 my $inner_subq = do {
ea95892e 178
179 # must use it here regardless of user requests
180 local $self->{_use_join_optimizer} = 1;
181
97e130fa 182 # throw away multijoins since we def. do not care about those inside the subquery
a6ef93cb 183 my ($inner_from, $inner_aliastypes) = $self->_prune_unused_joins ($from, $inner_select, $where, {
437a9cfa 184 %$inner_attrs, _force_prune_multiplying_joins => 1
185 });
ea95892e 186
1e4f9fb3 187 # uh-oh a multiplier (which is not us) left in, this is a problem
0a3441ee 188 if (
1e4f9fb3 189 $inner_aliastypes->{multiplying}
190 and
560978e2 191 # if there are user-supplied groups - assume user knows wtf they are up to
192 ( ! $inner_aliastypes->{grouping} or $inner_attrs->{_grouped_by_distinct} )
0a3441ee 193 and
1e4f9fb3 194 my @multipliers = grep { $_ ne $root_alias } keys %{$inner_aliastypes->{multiplying}}
0a3441ee 195 ) {
1e4f9fb3 196
197 # if none of the multipliers came from an order_by (guaranteed to have been combined
4a0eed52 198 # with a limit) - easy - just slap a group_by to simulate a collapse and be on our way
1e4f9fb3 199 if (
200 ! $inner_aliastypes->{ordering}
201 or
202 ! first { $inner_aliastypes->{ordering}{$_} } @multipliers
203 ) {
318e3d94 204
1e4f9fb3 205 my $unprocessed_order_chunks;
560978e2 206 ($inner_attrs->{group_by}, $unprocessed_order_chunks) = $self->_group_over_selection ({
207 %$inner_attrs,
208 from => $inner_from,
209 select => $inner_select,
210 });
1e4f9fb3 211
212 $self->throw_exception (
213 'A required group_by clause could not be constructed automatically due to a complex '
214 . 'order_by criteria. Either order_by columns only (no functions) or construct a suitable '
215 . 'group_by by hand'
216 ) if $unprocessed_order_chunks;
217 }
218 else {
219 # We need to order by external columns and group at the same time
220 # so we can calculate the proper limit
221 # This doesn't really make sense in SQL, however from DBICs point
222 # of view is rather valid (order the leftmost objects by whatever
223 # criteria and get the offset/rows many). There is a way around
224 # this however in SQL - we simply take the direction of each piece
225 # of the foreign order and convert them to MIN(X) for ASC or MAX(X)
226 # for DESC, and group_by the root columns. The end result should be
227 # exactly what we expect
228
1e4f9fb3 229 # supplement the main selection with pks if not already there,
4a0eed52 230 # as they will have to be a part of the group_by to collapse
1e4f9fb3 231 # things properly
232 my $cur_sel = { map { $_ => 1 } @$inner_select };
318e3d94 233
1e4f9fb3 234 my @pks = map { "$root_alias.$_" } $root_node->{-rsrc}->primary_columns
235 or $self->throw_exception( sprintf
236 'Unable to perform complex limited prefetch off %s without declared primary key',
237 $root_node->{-rsrc}->source_name,
238 );
239 for my $col (@pks) {
240 push @$inner_select, $col
241 unless $cur_sel->{$col}++;
242 }
243
244 # wrap any part of the order_by that "responds" to an ordering alias
245 # into a MIN/MAX
246 # FIXME - this code is a joke, will need to be completely rewritten in
247 # the DQ branch. But I need to push a POC here, otherwise the
248 # pesky tests won't pass
249 my $sql_maker = $self->sql_maker;
250 my ($lquote, $rquote, $sep) = map { quotemeta $_ } ($sql_maker->_quote_chars, $sql_maker->name_sep);
251 my $own_re = qr/ $lquote \Q$root_alias\E $rquote $sep | \b \Q$root_alias\E $sep /x;
e6977bbb 252 my @order_chunks = map { ref $_ eq 'ARRAY' ? $_ : [ $_ ] } $sql_maker->_order_by_chunks($attrs->{order_by});
253 my @new_order = map { \$_ } @order_chunks;
254 my $inner_columns_info = $self->_resolve_column_info($inner_from);
255
256 # loop through and replace stuff that is not "ours" with a min/max func
257 # everything is a literal at this point, since we are likely properly
258 # quoted and stuff
259 for my $i (0 .. $#new_order) {
260 my $chunk = $order_chunks[$i][0];
261
262 # skip ourselves
263 next if $chunk =~ $own_re;
264
cb3e87f5 265 ($chunk, my $is_desc) = $sql_maker->_split_order_chunk($chunk);
e6977bbb 266
267 # maybe our own unqualified column
318e3d94 268 my $ord_bit = (
269 $lquote and $sep and $chunk =~ /^ $lquote ([^$sep]+) $rquote $/x
270 ) ? $1 : $chunk;
271
e6977bbb 272 next if (
273 $ord_bit
274 and
275 $inner_columns_info->{$ord_bit}
276 and
277 $inner_columns_info->{$ord_bit}{-source_alias} eq $root_alias
278 );
279
# replace the chunk with a literal-with-binds \[ $sql, @bind ], carrying
# over whatever bind values followed the original chunk
280 $new_order[$i] = \[
1e4f9fb3 281 sprintf(
282 '%s(%s)%s',
283 ($is_desc ? 'MAX' : 'MIN'),
e6977bbb 284 $chunk,
1e4f9fb3 285 ($is_desc ? ' DESC' : ''),
286 ),
287 @ {$order_chunks[$i]} [ 1 .. $#{$order_chunks[$i]} ]
288 ];
289 }
290
e6977bbb 291 $inner_attrs->{order_by} = \@new_order;
292
293 # do not care about leftovers here - it will be all the functions
294 # we just created
560978e2 295 ($inner_attrs->{group_by}) = $self->_group_over_selection ({
296 %$inner_attrs,
297 from => $inner_from,
298 select => $inner_select,
299 });
1e4f9fb3 300 }
0a3441ee 301 }
d28bb90d 302
ea95892e 303 # we already optimized $inner_from above
97e130fa 304 # and already local()ized
305 $self->{_use_join_optimizer} = 0;
d28bb90d 306
ea95892e 307 # generate the subquery
6395604e 308 $self->_select_args_to_query (
ea95892e 309 $inner_from,
310 $inner_select,
311 $where,
312 $inner_attrs,
313 );
d28bb90d 314 };
315
316 # Generate the outer from - this is relatively easy (really just replace
317 # the join slot with the subquery), with a major caveat - we can not
318 # join anything that is non-selecting (not part of the prefetch), but at
319 # the same time is a multi-type relationship, as it will explode the result.
320 #
321 # There are two possibilities here
322 # - either the join is non-restricting, in which case we simply throw it away
323 # - it is part of the restrictions, in which case we need to collapse the outer
324 # result by tackling yet another group_by to the outside of the query
325
27e0370d 326 # work on a shallow copy
052e8431 327 $from = [ @$from ];
052e8431 328
d28bb90d 329 my @outer_from;
53c29913 330
27e0370d 331 # we may not be the head
97e130fa 332 if ($root_node_offset) {
560978e2 333 # first generate the outer_from, up and including the substitution point
97e130fa 334 @outer_from = splice @$from, 0, $root_node_offset;
27e0370d 335
336 push @outer_from, [
337 {
1e4f9fb3 338 -alias => $root_alias,
97e130fa 339 -rsrc => $root_node->{-rsrc},
1e4f9fb3 340 $root_alias => $inner_subq,
27e0370d 341 },
97e130fa 342 @{$from->[0]}[1 .. $#{$from->[0]}],
27e0370d 343 ];
344 }
345 else {
27e0370d 346 @outer_from = {
1e4f9fb3 347 -alias => $root_alias,
27e0370d 348 -rsrc => $root_node->{-rsrc},
1e4f9fb3 349 $root_alias => $inner_subq,
27e0370d 350 };
d28bb90d 351 }
352
560978e2 353 shift @$from; # what we just replaced above
97e130fa 354
ea95892e 355 # scan the *remaining* from spec against different attributes, and see which joins are needed
052e8431 356 # in what role
975b573a 357 my $outer_aliastypes = $outer_attrs->{_aliastypes} =
539ffe87 358 $self->_resolve_aliastypes_from_select_args( $from, $outer_select, $where, $outer_attrs );
052e8431 359
a4812caa 360 # unroll parents
# (one { alias => 1 } lookup per type: the first is for "selecting", the
# remaining three are for restricting/grouping/ordering)
1e4f9fb3 361 my ($outer_select_chain, @outer_nonselecting_chains) = map { +{
362 map { $_ => 1 } map { values %$_} map { @{$_->{-parents}} } values %{ $outer_aliastypes->{$_} || {} }
363 } } qw/selecting restricting grouping ordering/;
a4812caa 364
d28bb90d 365 # see what's left - throw away if not selecting/restricting
a4812caa 366 # also throw in a group_by if a non-selecting multiplier,
367 # to guard against cross-join explosions
36fd7f07 368 my $need_outer_group_by;
d28bb90d 369 while (my $j = shift @$from) {
370 my $alias = $j->[0]{-alias};
371
a4812caa 372 if (
373 $outer_select_chain->{$alias}
374 ) {
375 push @outer_from, $j
d28bb90d 376 }
1e4f9fb3 377 elsif (first { $_->{$alias} } @outer_nonselecting_chains ) {
d28bb90d 378 push @outer_from, $j;
a4812caa 379 $need_outer_group_by ||= $outer_aliastypes->{multiplying}{$alias} ? 1 : 0;
d28bb90d 380 }
381 }
382
1e4f9fb3 383 if ( $need_outer_group_by and $attrs->{_grouped_by_distinct} ) {
36fd7f07 384 my $unprocessed_order_chunks;
560978e2 385 ($outer_attrs->{group_by}, $unprocessed_order_chunks) = $self->_group_over_selection ({
386 %$outer_attrs,
387 from => \@outer_from,
388 select => $outer_select,
389 });
36fd7f07 390
391 $self->throw_exception (
392 'A required group_by clause could not be constructed automatically due to a complex '
393 . 'order_by criteria. Either order_by columns only (no functions) or construct a suitable '
394 . 'group_by by hand'
395 ) if $unprocessed_order_chunks;
396
397 }
398
d28bb90d 399 # This is totally horrific - the $where ends up in both the inner and outer query
400 # Unfortunately not much can be done until SQLA2 introspection arrives, and even
401 # then if where conditions apply to the *right* side of the prefetch, you may have
402 # to both filter the inner select (e.g. to apply a limit) and then have to re-filter
4a0eed52 403 # the outer select to exclude joins you didn't want in the first place
d28bb90d 404 #
405 # OTOH it can be seen as a plus: <ash> (notes that this query would make a DBA cry ;)
406 return (\@outer_from, $outer_select, $where, $outer_attrs);
407}
408
#
# I KNOW THIS SUCKS! GET SQLA2 OUT THE DOOR SO THIS CAN DIE!
#
# Due to a lack of SQLA2 we fall back to crude scans of all the
# select/where/order/group attributes, in order to determine what
# aliases are needed to fulfill the query. This information is used
# throughout the code to prune unnecessary JOINs from the queries
# in an attempt to reduce the execution time.
# Although the method is pretty horrific, the worst thing that can
# happen is for it to fail due to some scalar SQL, which in turn will
# result in a vocal exception.
#
# Arguments: ($from, $select, $where, $attrs); of $attrs only the having,
# group_by and order_by slots are consulted.
#
# Throws when $from is not an arrayref.
#
# Returns a hashref of the form
#   { $type => { $alias => { -parents => \@join_path, -seen_columns => \%cols } } }
# where $type is one of multiplying, restricting, grouping, joining,
# selecting, ordering. Types that end up with no aliases are removed.
# -seen_columns (keyed by "alias.column") is only present for aliases that
# were located by scanning the generated SQL.
#
sub _resolve_aliastypes_from_select_args {
  my ( $self, $from, $select, $where, $attrs ) = @_;

  $self->throw_exception ('Unable to analyze custom {from}')
    if ref $from ne 'ARRAY';

  # what we will return
  my $aliases_by_type;

  # see what aliases are there to work with
  my $alias_list;
  for (@$from) {
    my $j = $_;
    $j = $j->[0] if ref $j eq 'ARRAY';
    my $al = $j->{-alias}
      or next;

    $alias_list->{$al} = $j;
    $aliases_by_type->{multiplying}{$al} ||= { -parents => $j->{-join_path}||[] } if (
      # not array == {from} head == can't be multiplying
      ( ref($_) eq 'ARRAY' and ! $j->{-is_single} )
        or
      # a parent of ours is already a multiplier
      # NOTE(review): other code in this file treats -join_path as an AoH
      # { table => alias }; if so the hashrefs used as keys here can never
      # match a multiplier alias - confirm the intent before changing
      ( grep { $aliases_by_type->{multiplying}{$_} } @{ $j->{-join_path}||[] } )
    );
  }

  # get a column to source/alias map (including unambiguous unqualified ones)
  my $colinfo = $self->_resolve_column_info ($from);

  # set up a botched SQLA
  my $sql_maker = $self->sql_maker;

  # these are throw away results, do not pollute the bind stack
  local $sql_maker->{select_bind};
  local $sql_maker->{where_bind};
  local $sql_maker->{group_bind};
  local $sql_maker->{having_bind};
  local $sql_maker->{from_bind};

  # we can't scan properly without any quoting (\b doesn't cut it
  # everywhere), so unless there is proper quoting set - use our
  # own weird impossible character.
  # Also in the case of no quoting, we need to explicitly disable
  # name_sep, otherwise nasty legacy syntax like
  # { 'count(foo.id)' => { '>' => 3 } } will stop working
  local $sql_maker->{quote_char} = $sql_maker->{quote_char};
  local $sql_maker->{name_sep} = $sql_maker->{name_sep};

  unless (defined $sql_maker->{quote_char} and length $sql_maker->{quote_char}) {
    $sql_maker->{quote_char} = ["\x00", "\xFF"];
    # if we don't unset it we break the questionable but unfortunately
    # working 'MAX(foo.bar)' => { '>', 3 }
    $sql_maker->{name_sep} = '';
  }

  my ($lquote, $rquote, $sep) = map { quotemeta $_ } ($sql_maker->_quote_chars, $sql_maker->name_sep);

  # generate sql chunks
  my $to_scan = {
    restricting => [
      ($where
        ? ($sql_maker->_recurse_where($where))[0]
        : ()
      ),
      ($attrs->{having}
        ? ($sql_maker->_recurse_where($attrs->{having}))[0]
        : ()
      ),
    ],
    grouping => [
      ($attrs->{group_by}
        ? ($sql_maker->_render_sqla(group_by => $attrs->{group_by}))[0]
        : (),
      )
    ],
    joining => [
      $sql_maker->_recurse_from (
        ref $from->[0] eq 'ARRAY' ? $from->[0][0] : $from->[0],
        @{$from}[1 .. $#$from],
      ),
    ],
    selecting => [
      scalar $sql_maker->_render_sqla(select_select => $select),
    ],
    ordering => [
      map { $_->[0] } $self->_extract_order_criteria ($attrs->{order_by}, $sql_maker),
    ],
  };

  # local is not enough - need to ensure the inner objects get rebuilt
  # with the original quoting setup (or lack thereof)
  $sql_maker->clear_renderer;
  $sql_maker->clear_converter;

  # throw away empty chunks
  $_ = [ map { $_ || () } @$_ ] for values %$to_scan;

  # first see if we have any exact matches (qualified or unqualified)
  for my $type (keys %$to_scan) {
    for my $piece (@{$to_scan->{$type}}) {
      if ($colinfo->{$piece} and my $alias = $colinfo->{$piece}{-source_alias}) {
        $aliases_by_type->{$type}{$alias} ||= { -parents => $alias_list->{$alias}{-join_path}||[] };
        $aliases_by_type->{$type}{$alias}{-seen_columns}{$colinfo->{$piece}{-fq_colname}} = $piece;
      }
    }
  }

  # now loop through all fully qualified columns and get the corresponding
  # alias (should work even if they are in scalarrefs)
  for my $alias (keys %$alias_list) {
    # the alias is matched literally: \Q..\E keeps regex metacharacters
    # (and, under /x, whitespace) within it from altering the pattern
    my $al_re = qr/
      $lquote \Q$alias\E $rquote $sep (?: $lquote ([^$rquote]+) $rquote )?
        |
      \b \Q$alias\E \. ([^\s\)\($rquote]+)?
    /x;

    for my $type (keys %$to_scan) {
      for my $piece (@{$to_scan->{$type}}) {
        if (my @matches = $piece =~ /$al_re/g) {
          $aliases_by_type->{$type}{$alias} ||= { -parents => $alias_list->{$alias}{-join_path}||[] };
          $aliases_by_type->{$type}{$alias}{-seen_columns}{"$alias.$_"} = "$alias.$_"
            for grep { defined $_ } @matches;
        }
      }
    }
  }

  # now loop through unqualified column names, and try to locate them within
  # the chunks
  for my $col (keys %$colinfo) {
    next if $col =~ / \. /x;   # if column is qualified it was caught by the above

    # literal match of the column name, same reasoning as for the alias above
    my $col_re = qr/ $lquote (\Q$col\E) $rquote /x;

    for my $type (keys %$to_scan) {
      for my $piece (@{$to_scan->{$type}}) {
        if ( my @matches = $piece =~ /$col_re/g) {
          my $alias = $colinfo->{$col}{-source_alias};
          $aliases_by_type->{$type}{$alias} ||= { -parents => $alias_list->{$alias}{-join_path}||[] };
          $aliases_by_type->{$type}{$alias}{-seen_columns}{"$alias.$_"} = $_
            for grep { defined $_ } @matches;
        }
      }
    }
  }

  # Add any non-left joins to the restriction list (such joins are indeed restrictions)
  for my $j (values %$alias_list) {
    my $alias = $j->{-alias} or next;
    $aliases_by_type->{restricting}{$alias} ||= { -parents => $j->{-join_path}||[] } if (
      (not $j->{-join_type})
        or
      ($j->{-join_type} !~ /^left (?: \s+ outer)? $/xi)
    );
  }

  # types for which nothing was found are not reported at all
  for (keys %$aliases_by_type) {
    delete $aliases_by_type->{$_} unless keys %{$aliases_by_type->{$_}};
  }

  return $aliases_by_type;
}
583
# This is the engine behind { distinct => 1 }
#
# Takes a single \%attrs hashref, of which the from, select, order_by and
# alias slots are consulted.
#
# In list context returns ( \@group_by, $leftovers ), where $leftovers is
# an arrayref of the order criteria that could not be folded into the
# group_by, or undef when there are none. In scalar context returns just
# \@group_by.
sub _group_over_selection {
  my ($self, $attrs) = @_;

  my $colinfos = $self->_resolve_column_info ($attrs->{from});

  my (@group_by, %group_index);

  # the logic is: if it is a { func => val } we assume an aggregate,
  # otherwise if \'...' or \[...] we assume the user knows what is
  # going on thus group over it
  for my $sel (@{$attrs->{select}}) {
    next if ref($sel) eq 'HASH';

    push @group_by, $sel;
    $group_index{$sel}++;

    # register the fully qualified version of an unqualified column as well
    $group_index{"$colinfos->{$sel}{-source_alias}.$sel"}++
      if $colinfos->{$sel} and $sel !~ /\./;
  }

  # add any order_by parts *from the main source* that are not already
  # present in the group_by
  # we need to be careful not to add any named functions/aggregates
  # i.e. order_by => [ ... { count => 'foo' } ... ]
  my @leftovers;
  for my $criterion ($self->_extract_order_criteria($attrs->{order_by})) {

    # only real columns are considered: a criterion with bind values
    # attached (for functions the user got to do an explicit group_by)
    # has no column info to look up
    my $ci = (@$criterion == 1)
      ? $colinfos->{$criterion->[0]}
      : undef
    ;

    unless ( $ci and $ci->{-source_alias} eq $attrs->{alias} ) {
      push @leftovers, $criterion;
      next;
    }

    my $fq_name = $ci->{-fq_colname};
    push @group_by, $fq_name unless $group_index{$fq_name}++;
  }

  return \@group_by unless wantarray;

  return ( \@group_by, (@leftovers ? \@leftovers : undef) );
}
637
# Maps the aliases found in $ident to their result sources.
#
# $ident is either a DBIx::Class::ResultSource object (reported under the
# alias 'me'), or a {from} arrayref whose elements are \%tabinfo nodes or
# [ \%tabinfo, ... ] join nodes. Only nodes carrying an -rsrc contribute.
# Anything else yields an empty map.
#
# Returns a hashref { $alias => $rsrc, ... }
sub _resolve_ident_sources {
  my ($self, $ident) = @_;

  # this is compat mode for insert/update/delete which do not deal with aliases
  return { me => $ident }
    if blessed($ident) and $ident->isa("DBIx::Class::ResultSource");

  my %source_of;

  # the reason this is so contrived is that $ident may be a {from}
  # structure, specifying multiple tables to join
  if (ref($ident) eq 'ARRAY') {
    for my $node (@$ident) {
      my $tabinfo =
          ( ref($node) eq 'HASH' )                                 ? $node
        : ( ref($node) eq 'ARRAY' and ref($node->[0]) eq 'HASH' )  ? $node->[0]
        :                                                            undef
      ;

      next unless $tabinfo and $tabinfo->{-rsrc};

      $source_of{ $tabinfo->{-alias} } = $tabinfo->{-rsrc};
    }
  }

  return \%source_of;
}
667
# Takes $ident, \@column_names
#
# returns { $column_name => \%column_info, ... }
# Each %column_info is a copy of the source-supplied column info, augmented
# with -result_source, -source_alias, -fq_colname and -colname. An
# unqualified name that resolves is additionally reported under its
# "alias.column" form.
#
# If no column names are supplied returns info about *all* columns
# for all sources (plus every unqualified name that is unambiguous)
#
# Names that can not be attributed to a known alias are silently skipped;
# a name attributed to a source that does not have such a column throws.
sub _resolve_column_info {
  my ($self, $ident, $colnames) = @_;
  my $alias2src = $self->_resolve_ident_sources($ident);

  my (%seen_cols, @auto_colnames);

  # compile a global list of column names, to be able to properly
  # disambiguate unqualified column names (if at all possible)
  for my $alias (keys %$alias2src) {
    for my $colname ( $alias2src->{$alias}->columns ) {
      push @{$seen_cols{$colname}}, $alias;
      push @auto_colnames, "$alias.$colname" unless $colnames;
    }
  }

  unless ($colnames) {
    my @unambiguous = grep { @{$seen_cols{$_}} == 1 } (keys %seen_cols);
    $colnames = [ @auto_colnames, @unambiguous ];
  }

  my (%return, $colinfos);
  for my $col (@$colnames) {
    my ($source_alias, $colname) = $col =~ m/^ (?: ([^\.]+) \. )? (.+) $/x;

    # if the column was seen exactly once - we know which rsrc it came from
    unless ($source_alias) {
      my $owners = $seen_cols{$colname};
      $source_alias = $owners->[0]
        if $owners and @$owners == 1;
    }

    next unless $source_alias;

    my $rsrc = $alias2src->{$source_alias}
      or next;

    # columns_info is asked for once per alias and reused afterwards
    my $src_colinfos = ( $colinfos->{$source_alias} ||= $rsrc->columns_info );

    my $ci = $src_colinfos->{$colname} || $self->throw_exception(
      "No such column '$colname' on source " . $rsrc->source_name
    );

    my $was_unqualified = ( $col eq $colname );

    $return{$col} = {
      %$ci,
      -result_source => $rsrc,
      -source_alias => $source_alias,
      -fq_colname => ( $was_unqualified ? "$source_alias.$col" : $col ),
      -colname => $colname,
    };

    $return{"$source_alias.$colname"} = $return{$col}
      if $was_unqualified;
  }

  return \%return;
}
728
# The DBIC relationship chaining implementation is pretty simple - every
# new related_relationship is pushed onto the {from} stack, and the {select}
# window simply slides further in. This means that when we count somewhere
# in the middle, we got to make sure that everything in the join chain is an
# actual inner join, otherwise the count will come back with unpredictable
# results (a resultset may be generated with _some_ rows regardless of if
# the relation which the $rs currently selects has rows or not). E.g.
# $artist_rs->cds->count - normally generates:
# SELECT COUNT( * ) FROM artist me LEFT JOIN cd cds ON cds.artist = me.artistid
# which actually returns the number of artists * (number of cds || 1)
#
# So what we do here is crawl {from}, determine if the current alias is at
# the top of the stack, and if not - make sure the chain is inner-joined down
# to the root.
#
# Returns $from itself whenever there is nothing to change, otherwise a new
# arrayref in which every join on the path to $alias has its -join_type
# removed. The original $from and its nodes are never modified.
#
sub _inner_join_to_node {
  my ($self, $from, $alias) = @_;

  # subqueries and other oddness are naturally not supported
  return $from unless ref($from) eq 'ARRAY';
  return $from unless @$from > 1;
  return $from unless ref($from->[0]) eq 'HASH';
  return $from unless $from->[0]{-alias};

  # $alias is the head of $from - nothing to do
  return $from if $from->[0]{-alias} eq $alias;

  # find the current $alias in the $from structure
  my $target_join = first { $_->[0]{-alias} eq $alias } @{$from}[1 .. $#$from];

  my $switch_branch = $target_join
    ? $target_join->[0]{-join_path}
    : undef
  ;

  # something else went quite wrong
  return $from unless $switch_branch;

  # there's one k/v per join-path element: { relname => alias }
  my %on_switch_path = map { (values %$_), 1 } @$switch_branch;

  # So it looks like we will have to switch some stuff around.
  # local() is useless here as we will be leaving the scope
  # anyway, and deep cloning is just too expensive
  # So replace the first hashref in the node arrayref manually
  my @new_from = ($from->[0]);

  for my $join (@{$from}[1 .. $#$from]) {

    unless ( $on_switch_path{ $join->[0]{-alias} } ) {
      push @new_from, $join;
      next;
    }

    my ($node_attrs, @conditions) = @$join;

    my %inner_attrs = %$node_attrs;
    delete $inner_attrs{-join_type};

    push @new_from, [ \%inner_attrs, @conditions ];
  }

  return \@new_from;
}
798
# Breaks an order_by specification into its individual criteria.
#
# Arguments: ($order_by, $sql_maker); $sql_maker is optional and defaults
# to $self->sql_maker.
#
# The order_by is converted to a DQ tree via the sql maker's converter,
# the chain of nodes is walked through their {from} links, and each
# collected {by} part is rendered with _render_dq.
#
# Returns a list of arrayrefs, one per criterion, each holding whatever
# _render_dq returned for that part.
sub _extract_order_criteria {
  my ($self, $order_by, $sql_maker) = @_;

  $sql_maker ||= $self->sql_maker;

  my $order_dq = $sql_maker->converter->_order_by_to_dq($order_by);

  # NOTE(review): the nodes walked here are accessed as { by, from }, yet
  # the loop tests is_Literal() - verify this is the intended node-type
  # predicate (left as-is, behavior unchanged)
  my @by;
  while (is_Literal($order_dq)) {
    push @by, $order_dq->{by};
    $order_dq = $order_dq->{from};
  }

  # the chunk-parsing implementation that used to follow this return could
  # never be reached and has been removed
  return map { [ $sql_maker->_render_dq($_) ] } @by;
}
855
# Determines whether the supplied order_by (optionally combined with the
# fixed-value columns extracted from $where) covers an identifying column
# set of at least one of the sources in $ident.
#
# Returns 1 when it does, undef otherwise (including when none of the
# columns could be resolved).
sub _order_by_is_stable {
  my ($self, $ident, $order_by, $where) = @_;

  my @candidate_cols = map { $_->[0] } $self->_extract_order_criteria($order_by);

  push @candidate_cols, @{ $self->_extract_fixed_condition_columns($where) }
    if $where;

  my $colinfo = $self->_resolve_column_info($ident, \@candidate_cols);

  return undef unless keys %$colinfo;

  # regroup as { $source_alias => { $colname => \%colinfo } }
  my %cols_per_src;
  for my $ci (values %$colinfo) {
    $cols_per_src{ $ci->{-source_alias} }{ $ci->{-colname} } = $ci;
  }

  for my $src_cols (values %cols_per_src) {
    # every entry of a group carries the same source - any one will do
    my ($any_ci) = values %$src_cols;

    return 1
      if $any_ci->{-result_source}->_identifying_column_set($src_cols);
  }

  return undef;
}
876
# A close relative of _order_by_is_stable, with two differences: it works
# against a single result source, and it succeeds only if the *leading*
# portion of the order_by (the columns belonging to that source) is stable
# on its own, optionally helped by columns fixed via $where.
#
# Arguments:
#   $main_rsrc - the result source in question (an arrayref is rejected)
#   $order_by  - order specification, parsed by _extract_order_criteria
#   $where     - optional condition, inspected by
#                _extract_fixed_condition_columns
#
# On success returns a hashref keyed by the order column names as they
# were given, each value being a copy of the column's colinfo plus
# -idx_in_order_subset (the column's position in the order_by). The result
# is cut off right after the last column needed to complete the
# identifying set. Returns nothing (empty list / undef) otherwise
sub _main_source_order_by_portion_is_stable {
  my ($self, $main_rsrc, $order_by, $where) = @_;

  die "Huh... I expect a blessed result_source..."
    if ref($main_rsrc) eq 'ARRAY';

  my @ord_cols = map { $_->[0] } $self->_extract_order_criteria($order_by);
  return unless @ord_cols;

  my $colinfos = $self->_resolve_column_info($main_rsrc);

  # keep only the leading run of order columns resolving to $main_rsrc
  for my $i (0 .. $#ord_cols) {
    my $ci = $colinfos->{ $ord_cols[$i] };

    if ( ! $ci or $ci->{-result_source} != $main_rsrc ) {
      $#ord_cols = $i - 1;
      last;
    }
  }

  # the truncation above may have left nothing behind
  return unless @ord_cols;

  # make every surviving column reachable by both its plain and its
  # fully qualified name
  my $order_portion_ci = { map {
    my $ci = $colinfos->{$_};
    ( $ci->{-colname} => $ci, $ci->{-fq_colname} => $ci )
  } @ord_cols };

  # The extractor must be called in scalar context: in list context it
  # returns an empty list for conditions it can not analyze, which would
  # turn the call below into _resolve_column_info($main_rsrc), i.e. "all
  # columns of the source are fixed"
  my $fixed_cols = $where
    ? ( $self->_extract_fixed_condition_columns($where) || [] )
    : []
  ;
  my $fixed_ci = @$fixed_cols
    ? $self->_resolve_column_info($main_rsrc, $fixed_cols)
    : {}
  ;

  # since all we check here are the start of the order_by belonging to the
  # top level $rsrc, a present identifying set will mean that the resultset
  # is ordered by its leftmost table in a stable manner
  #
  # RV of _identifying_column_set contains unqualified names only
  my $unqualified_idset = $main_rsrc->_identifying_column_set({
    %$fixed_ci,
    %$order_portion_ci,
  }) or return;

  # the part of the identifying set which has to come from the order_by
  # (the remainder is covered by the fixed columns)
  my %unqualified_idcols_from_order = map {
    $order_portion_ci->{$_} ? ( $_ => $order_portion_ci->{$_} ) : ()
  } @$unqualified_idset;

  # extra optimization - cut the order_by at the end of the identifying set
  # (just in case the user was stupid and overlooked the obvious)
  my $ret_info;
  for my $i (0 .. $#ord_cols) {
    my $col = $ord_cols[$i];

    $ret_info->{$col} = {
      %{ $order_portion_ci->{$col} },
      -idx_in_order_subset => $i,
    };
    delete $unqualified_idcols_from_order{ $ret_info->{$col}{-colname} };

    # every identifying column was seen - the portion so far is sufficient
    return $ret_info unless keys %unqualified_idcols_from_order;
  }

  die 'How did we get here...';
}
947
# Returns an arrayref of column names which *definitely* have some sort of
# non-nullable equality requested in the given condition specification.
# This is used to figure out if a resultset is constrained to a column
# which is part of a unique constraint, which in turn allows us to better
# predict how ordering will behave etc.
#
# This is a rudimentary and incomplete extractor. That is OK: it is meant
# to be conservative, and when it fails to find something that is in fact
# there, the callers simply work with less information.
#
# Arguments:
#   $where  - the condition; only hashrefs are examined
#   $nested - true on recursive calls (descending into -and)
#
# Returns an arrayref on a top-level call (empty if nothing was found or
# the condition is not a hashref), and a plain list when $nested is true
sub _extract_fixed_condition_columns {
  my ($self, $where, $nested) = @_;

  # Anything but a hashref contributes no columns. A top-level call still
  # has to produce an arrayref: a bare return would hand undef to callers
  # dereferencing the result, and an empty list to callers splicing it
  # into an argument list
  return ( $nested ? () : [] )
    unless ref $where eq 'HASH';

  my @cols;
  for my $lhs (keys %$where) {
    my $rhs = $where->{$lhs};

    if ($lhs =~ /^\-and$/i) {
      # -and takes either a list of conditions or a single condition
      push @cols,
        map { $self->_extract_fixed_condition_columns($_, 1) }
        ( ref $rhs eq 'ARRAY' ? @$rhs : $rhs )
      ;
    }
    elsif ($lhs !~ /^\-/) {
      # a plain defined value, or a sole '=' operator with a defined value
      # NOTE(review): any defined value under '=' is accepted, references
      # (e.g. an arrayref) included - confirm this is intended
      push @cols, $lhs if (
        defined $rhs
          and
        (
          ! ref $rhs
            or
          ( ref $rhs eq 'HASH' and keys %$rhs == 1 and defined $rhs->{'='} )
        )
      );
    }
    # all other -operators (-or, -not, ...) are deliberately ignored
  }

  return $nested ? @cols : \@cols;
}
bac6c4fb 984
d28bb90d 9851;