Another parser microoptimisation - lose nullability checks where possible
[dbsrgits/DBIx-Class-Historic.git] / lib / DBIx / Class / ResultSource / RowParser / Util.pm
CommitLineData
9f98c4b2 1package # hide from the pauses
2 DBIx::Class::ResultSource::RowParser::Util;
3
4use strict;
5use warnings;
6
ce556881 7use List::Util 'first';
9f98c4b2 8use B 'perlstring';
9
10use base 'Exporter';
11our @EXPORT_OK = qw(
12 assemble_simple_parser
13 assemble_collapsing_parser
14);
15
52864fbd 16# working title - we are hoping to extract this eventually...
17our $null_branch_class = 'DBIx::ResultParser::RelatedNullBranch';
18
# Builds the source of a non-collapsing row parser.
#
# Takes a single hashref of assembler options, handed untouched (as $_[0])
# to __visit_infmap_simple(). Returns a string of perl source: a block that
# rewrites every row found in @{$_[0]} of the *generated* code into the
# nested structure described by the options.
sub assemble_simple_parser {

  # the non-collapsing assembler is easy
  # FIXME SUBOPTIMAL there could be a yet faster way to do things here, but
  # need to try an actual implementation and benchmark it:
  #
  # <timbunce_> First setup the nested data structure you want for each row
  #   Then call bind_col() to alias the row fields into the right place in
  #   the data structure, then to fetch the data do:
  # push @rows, dclone($row_data_struct) while ($sth->fetchrow);
  #
  my $row_struct_src = __visit_infmap_simple($_[0]);

  my $loop_src = '$_ = ' . $row_struct_src . ' for @{$_[0]}';

  # every quoted value placeholder becomes a direct reference into the
  # row currently aliased to $_
  $loop_src =~ s{ \' \xFF__VALPOS__(\d+)__\xFF \' }{ '$_->[' . $1 . ']' }gex;

  return join '',
    " { use strict; use warnings FATAL => 'all';\n",
    $loop_src,
    "\n }",
  ;
}
38
# the simple non-collapsing nested structure recursor
#
# Takes a hashref and reads from it:
#   val_index           - hashref of (possibly dotted) column name => row position
#   hri_style           - true: emit a flat hash per node instead of [ \%me, \%rels ]
#   prune_null_branches - true: an all-NULL related branch becomes undef,
#                         false: it is kept and blessed into $null_branch_class
#
# Returns a string of perl source describing one node and (by recursion)
# everything hanging off it. Values are left as quoted VALPOS placeholders.
sub __visit_infmap_simple {
  my $args = shift;

  # separate our own columns from the ones belonging to relationships
  # ( "rel.col" => idx ends up as $rel_idx{rel}{col} = idx )
  my (%own_idx, %rel_idx);
  for my $col (keys %{$args->{val_index}}) {
    if ( my ($rel, $rest) = $col =~ /^ ([^\.]+) \. (.+) /x ) {
      $rel_idx{$rel}{$rest} = $args->{val_index}{$col};
    }
    else {
      $own_idx{$col} = $args->{val_index}{$col};
    }
  }

  my $has_own_cols = keys %own_idx;

  my @rel_pairs_src;
  for my $rel (sort keys %rel_idx) {

    my $rel_src = __visit_infmap_simple({ %$args,
      val_index => $rel_idx{$rel},
    });

    # the nullability check is emitted only for nodes that have columns
    # of their own
    if ($has_own_cols) {

      my $all_null_src = join ' && ',
        map { "( ! defined '\xFF__VALPOS__${_}__\xFF' )" }
        sort { $a <=> $b }
        values %{$rel_idx{$rel}}
      ;

      $rel_src = $args->{prune_null_branches}
        ? '( (' . $all_null_src . ') ? undef : ' . $rel_src . ' )'
        : '( (' . $all_null_src . ') ? bless( (' . $rel_src . '), '
            . perlstring($null_branch_class) . ' ) : ' . $rel_src . ' )'
      ;
    }

    push @rel_pairs_src, '( ' . perlstring($rel) . ' => ' . $rel_src . ' )';
  }

  my $own_src = $has_own_cols
    ? __result_struct_to_source(\%own_idx)
    : undef
  ;

  # classic layout: [ \%own_columns_or_undef, \%relationships (if any) ]
  unless ($args->{hri_style}) {
    my @slots = ( $own_src || 'undef' );

    push @slots, '{ ' . join(',', @rel_pairs_src) . ' }'
      if @rel_pairs_src;

    return '[' . join(',', @slots) . ']';
  }

  # HRI layout: own columns and relationships share a single hash, so
  # peel the braces off the column struct and splice its contents in
  my @members = @rel_pairs_src;
  if ($own_src) {
    $own_src =~ s/^ \s* \{ | \} \s* $//gx;
    unshift @members, $own_src if $own_src;
  }

  return '{ ' . join(', ', @members) . ' }';
}
107
# Builds the source of a collapsing (prefetch-folding) row parser.
#
# Takes a hashref and reads from it:
#   collapse_map        - hashref; either -identifying_columns is a non-empty
#                         arrayref of column positions, or
#                         -identifying_columns_variants is a non-empty
#                         arrayref of such arrayrefs
#   val_index           - hashref, column name => row position
#   prune_null_branches - when true (and the root is fully identified) the
#                         generated code reads ids straight from the row
#                         instead of going through %cur_row_ids
# The (copied) hashref is then handed to __visit_infmap_collapse(), so any
# option understood there applies as well.
#
# Returns a string of perl source. Dies with 'Unexpected collapse map
# contents' when neither identifying-column list has any entries.
#
# The argument hash is shallow-copied first: the variants branch below
# installs a replacement collapse_map, and that override must not leak
# back into the hash owned by the caller.
sub assemble_collapsing_parser {
  my $args = { %{ shift() } };

  # it may get unset further down
  my $no_rowid_container = $args->{prune_null_branches};

  my ($top_node_key, $top_node_key_assembler);

  if (scalar @{$args->{collapse_map}{-identifying_columns}}) {
    $top_node_key = join ('', map
      { "{'\xFF__IDVALPOS__${_}__\xFF'}" }
      @{$args->{collapse_map}{-identifying_columns}}
    );
  }
  elsif( my @variants = @{$args->{collapse_map}{-identifying_columns_variants}} ) {

    # no single identifying set for the root: emit code that derives a
    # virtual id from the first variant whose leading column is defined,
    # falling back to a key built from the current row position
    my @path_parts = map { sprintf
      "( ( defined '\xFF__VALPOS__%d__\xFF' ) && (join qq(\xFF), '', %s, '') )",
      $_->[0],  # checking just first is enough - one ID defined, all defined
      ( join ', ', map { "'\xFF__VALPOS__${_}__\xFF'" } @$_ ),
    } @variants;

    # a slot number past every real column position
    my $virtual_column_idx = (scalar keys %{$args->{val_index}} ) + 1;

    $top_node_key = "{'\xFF__IDVALPOS__${virtual_column_idx}__\xFF'}";

    $top_node_key_assembler = sprintf "'\xFF__IDVALPOS__%d__\xFF' = (%s);",
      $virtual_column_idx,
      "\n" . join( "\n or\n", @path_parts, qq{"\0\$rows_pos\0"} )
    ;

    $args->{collapse_map} = {
      %{$args->{collapse_map}},
      -custom_node_key => $top_node_key,
    };

    # the virtual id has to live somewhere - force the %cur_row_ids container
    $no_rowid_container = 0;
  }
  else {
    die('Unexpected collapse map contents');
  }

  my ($data_assemblers, $stats) = __visit_infmap_collapse ($args);

  my @idcol_args = $no_rowid_container ? ('', '') : (
    ', %cur_row_ids', # only declare the variable if we'll use it
    join ("\n", map {
      # in case we prune - we will never hit these undefs
      $args->{prune_null_branches}
        ? qq(\$cur_row_ids{$_} = \$cur_row_data->[$_];)
        : qq(\$cur_row_ids{$_} = defined(\$cur_row_data->[$_]) ? \$cur_row_data->[$_] : "\0NULL\xFF\$rows_pos\xFF$_\0";)
    } sort { $a <=> $b } keys %{ $stats->{idcols_seen} } ),
  );

  # template slots: %1 extra variable declaration, %2 id extraction,
  # %3 virtual root id assembler, %4 root node key, %5 per-node assemblers
  my $parser_src = sprintf (<<'EOS', @idcol_args, $top_node_key_assembler||'', $top_node_key, join( "\n", @{$data_assemblers||[]} ) );
### BEGIN LITERAL STRING EVAL
  my $rows_pos = 0;
  my ($result_pos, @collapse_idx, $cur_row_data %1$s);

  # this loop is a bit arcane - the rationale is that the passed in
  # $_[0] will either have only one row (->next) or will have all
  # rows already pulled in (->all and/or unordered). Given that the
  # result can be rather large - we reuse the same already allocated
  # array, since the collapsed prefetch is smaller by definition.
  # At the end we cut the leftovers away and move on.
  while ($cur_row_data = (
    ( $rows_pos >= 0 and $_[0][$rows_pos++] )
      or
    ( $_[1] and $rows_pos = -1 and $_[1]->() )
  ) ) {

    # this code exists only when we are using a cur_row_ids
    # furthermore the undef checks may or may not be there
    # depending on whether we prune or not
    #
    # due to left joins some of the ids may be NULL/undef, and
    # won't play well when used as hash lookups
    # we also need to differentiate NULLs on per-row/per-col basis
    # (otherwise folding of optional 1:1s will be greatly confused
%2$s

    # in the case of an underdefined root - calculate the virtual id (otherwise no code at all)
%3$s

    # if we were supplied a coderef - we are collapsing lazily (the set
    # is ordered properly)
    # as long as we have a result already and the next result is new we
    # return the pre-read data and bail
$_[1] and $result_pos and ! $collapse_idx[0]%4$s and (unshift @{$_[2]}, $cur_row_data) and last;

    # the rel assemblers
%5$s

  }

  $#{$_[0]} = $result_pos - 1; # truncate the passed in array to where we filled it with results
### END LITERAL STRING EVAL
EOS

  # !!! note - different var than the one above
  # change the quoted placeholders to unquoted alias-references
  $parser_src =~ s/ \' \xFF__VALPOS__(\d+)__\xFF \' /"\$cur_row_data->[$1]"/gex;
  $parser_src =~ s/
    \' \xFF__IDVALPOS__(\d+)__\xFF \'
  /
    $no_rowid_container ? "\$cur_row_data->[$1]" : "\$cur_row_ids{$1}"
  /gex;

  return " { use strict; use warnings FATAL => 'all';\n$parser_src\n }";
}
218
219
# the collapsing nested structure recursor
#
# Takes a hashref (shallow-copied on entry) and reads from it:
#   val_index           - hashref of (possibly dotted) column name => row position
#   collapse_map        - hashref for the current node: -identifying_columns,
#                         optional -custom_node_key, -is_single, -is_optional,
#                         plus one nested map per relationship name
#   hri_style           - true: nodes are plain hashes; false: [ \%me, \%rels ]
#   prune_null_branches - selects how an absent optional branch is emitted
#   -node_idx_counter, -parent_node_idx, -parent_node_key, -node_relname
#                       - bookkeeping filled in by the recursion itself
#
# Returns a two element list:
#   * arrayref of perl source statements for this node and its descendants
#   * hashref { idcols_seen => { position => 1, ... } } covering every
#     identifying column met in this subtree
sub __visit_infmap_collapse {
  my $args = {%{ shift() }};

  # the counter is a scalar ref shared through the copied args, hence every
  # node of the tree receives a distinct index
  my $cur_node_idx = ${ $args->{-node_idx_counter} ||= \do { my $x = 0} }++;

  my ($my_cols, $rel_cols) = {};
  for ( keys %{$args->{val_index}} ) {
    if ($_ =~ /^ ([^\.]+) \. (.+) /x) {
      $rel_cols->{$1}{$2} = $args->{val_index}{$_};
    }
    else {
      $my_cols->{$_} = $args->{val_index}{$_};
    }
  }


  # in an HRI node columns and relationships live in the same hash: drop
  # any own column that shares its name with a relationship
  if ($args->{hri_style}) {
    delete $my_cols->{$_} for grep { $rel_cols->{$_} } keys %$my_cols;
  }

  my $me_struct;
  $me_struct = __result_struct_to_source($my_cols) if keys %$my_cols;

  $me_struct = sprintf( '[ %s ]', $me_struct||'' )
    unless $args->{hri_style};


  my $node_key = $args->{collapse_map}->{-custom_node_key} || join ('', map
    { "{'\xFF__IDVALPOS__${_}__\xFF'}" }
    @{$args->{collapse_map}->{-identifying_columns}}
  );
  my $node_idx_slot = sprintf '$collapse_idx[%d]%s', $cur_node_idx, $node_key;


  my @src;

  if ($cur_node_idx == 0) {
    # the root: a node not seen before claims the next result position
    push @src, sprintf( '%s ||= $_[0][$result_pos++] = %s;',
      $node_idx_slot,
      $me_struct || '{}',
    );
  }
  else {
    my $parent_attach_slot = sprintf( '$collapse_idx[%d]%s%s{%s}',
      @{$args}{qw/-parent_node_idx -parent_node_key/},
      $args->{hri_style} ? '' : '[1]',
      perlstring($args->{-node_relname}),
    );

    if ($args->{collapse_map}->{-is_single}) {
      push @src, sprintf ( '%s ||= %s%s;',
        $parent_attach_slot,
        $node_idx_slot,
        $me_struct ? " = $me_struct" : '',
      );
    }
    else {
      push @src, sprintf('(! %s) and push @{%s}, %s%s;',
        $node_idx_slot,
        $parent_attach_slot,
        $node_idx_slot,
        $me_struct ? " = $me_struct" : '',
      );
    }
  }

  my $known_present_ids = { map { $_ => 1 } @{$args->{collapse_map}{-identifying_columns}} };
  my ($stats, $rel_src);

  for my $rel (sort keys %$rel_cols) {

    my $relinfo = $args->{collapse_map}{$rel};

    ($rel_src, $stats->{$rel}) = __visit_infmap_collapse({ %$args,
      val_index => $rel_cols->{$rel},
      collapse_map => $relinfo,
      -parent_node_idx => $cur_node_idx,
      -parent_node_key => $node_key,
      -node_relname => $rel,
    });

    my $rel_src_pos = $#src + 1;
    push @src, @$rel_src;

    # an optional relationship needs a NULL test - use the first of its
    # identifying columns that is not already an identifier of this node
    if (
      $relinfo->{-is_optional}
        and
      defined ( my $first_distinct_child_idcol = first
        { ! $known_present_ids->{$_} }
        @{$relinfo->{-identifying_columns}}
      )
    ) {

      if ($args->{prune_null_branches}) {

        # start of wrap of the entire chain in a conditional
        splice @src, $rel_src_pos, 0, sprintf "( ! defined %s )\n ? %s%s{%s} = %s\n : do {",
          "'\xFF__VALPOS__${first_distinct_child_idcol}__\xFF'",
          $node_idx_slot,
          $args->{hri_style} ? '' : '[1]',
          perlstring($rel),
          ($args->{hri_style} && $relinfo->{-is_single}) ? 'undef' : '[]'
        ;

        # end of wrap
        push @src, '};'
      }
      else {

        # goes right after the first statement of the branch (the one
        # attaching it to this node), marking an absent branch by blessing
        # it. The relationship slot is addressed exactly like everywhere
        # else in this sub: directly on an HRI node, under [1] otherwise
        splice @src, $rel_src_pos + 1, 0, sprintf ( '(defined %s) or bless (%s%s{%s}, %s);',
          "'\xFF__VALPOS__${first_distinct_child_idcol}__\xFF'",
          $node_idx_slot,
          $args->{hri_style} ? '' : '[1]',
          perlstring($rel),
          perlstring($null_branch_class),
        );
      }
    }
  }

  return (
    \@src,
    {
      idcols_seen => {
        ( map { %{ $_->{idcols_seen} } } values %$stats ),
        ( map { $_ => 1 } @{$args->{collapse_map}->{-identifying_columns}} ),
      }
    }
  );
}
350
# Renders a { column name => row position } hashref (the sole argument) as
# the perl source of a hash constructor. Keys are emitted in sorted order,
# each value being the quoted VALPOS placeholder for its position.
sub __result_struct_to_source {
  my @pairs_src;

  for my $col (sort keys %{$_[0]}) {
    push @pairs_src, sprintf(
      "%s => '\xFF__VALPOS__%d__\xFF'",
      perlstring($col),
      $_[0]{$col},
    );
  }

  return '{ ' . join(', ', @pairs_src) . ' }';
}
357
3581;