changed add_attribute to add_to_attribute
[catagits/HTML-Zoom.git] / lib / HTML / Zoom / FilterBuilder.pm
CommitLineData
456a815d 1package HTML::Zoom::FilterBuilder;
2
456a815d 3use strict;
4use warnings FATAL => 'all';
d80786d0 5use base qw(HTML::Zoom::SubObject);
456a815d 6use HTML::Zoom::CodeStream;
7
# Delegate to the stream utilities object held by our zoom config to build
# a stream from the given code reference (all arguments are forwarded).
sub _stream_from_code {
  my $self = shift;
  my $utils = $self->_zconfig->stream_utils;
  return $utils->stream_from_code(@_);
}
11
# Delegate to the stream utilities object held by our zoom config to build
# a stream from the given list of events (all arguments are forwarded).
sub _stream_from_array {
  my $self = shift;
  my $utils = $self->_zconfig->stream_utils;
  return $utils->stream_from_array(@_);
}
15
# Delegate to the stream utilities object held by our zoom config to turn
# a "proto" value into a stream (all arguments are forwarded unchanged).
sub _stream_from_proto {
  my $self = shift;
  my $utils = $self->_zconfig->stream_utils;
  return $utils->stream_from_proto(@_);
}
19
# Delegate to the stream utilities object held by our zoom config to
# concatenate the given streams (all arguments are forwarded unchanged).
sub _stream_concat {
  my $self = shift;
  my $utils = $self->_zconfig->stream_utils;
  return $utils->stream_concat(@_);
}
23
# Delegate to the stream utilities object held by our zoom config to
# flatten a stream whose items are themselves streams.
sub _flatten_stream_of_streams {
  my $self = shift;
  my $utils = $self->_zconfig->stream_utils;
  return $utils->flatten_stream_of_streams(@_);
}
27
# Build a filter that sets attribute $name to $value on the event it is
# given, replacing any existing value.
#
# Arguments are whatever _parse_attribute_args accepts. The returned
# coderef takes an event hashref and returns a new event hashref; the
# original event is not modified.
sub set_attribute {
  my $self = shift;
  my ($name, $value) = $self->_parse_attribute_args(@_);
  return sub {
    my ($evt) = @_;
    my $attrs = $evt->{attrs};
    my $already_present = exists $attrs->{$name};
    # raw and raw_attrs are blanked in the copy - presumably so the
    # serialiser regenerates the tag from attrs rather than reusing stale
    # source text.
    my %updated = (
      %$evt,
      raw       => undef,
      raw_attrs => undef,
      attrs     => { %$attrs, $name => $value },
    );
    # Only extend the ordered name list when the attribute is new.
    unless ($already_present) {
      $updated{attr_names} = [ @{$evt->{attr_names}}, $name ];
    }
    return \%updated;
  };
}
42
# Normalise the arguments of the attribute filters into a (name, value)
# pair, with the value passed through the parser's html_escape.
#
# Two call forms are accepted:
#   ->add_to_attribute(name => 'value')
#   ->add_to_attribute({ name => 'name', value => 'value' })
sub _parse_attribute_args {
  my ($self, @args) = @_;
  my ($name, $value);
  if (@args > 1) {
    ($name, $value) = @args;
  }
  else {
    ($name, $value) = @{$args[0]}{qw(name value)};
  }
  return ($name, $self->_zconfig->parser->html_escape($value));
}
50
# Deprecated entry point: always throws, pointing callers at the new name.
sub add_attribute {
  my $message = "renamed to add_to_attribute. killing this entirely for 1.0";
  die $message;
}
54
# Build a filter that appends $value to attribute $name on the event it is
# given. An existing value is kept and the new one is joined on with a
# single space; a missing attribute is created with just the new value.
#
# Arguments are whatever _parse_attribute_args accepts. The returned
# coderef takes an event hashref and returns a new event hashref; the
# original event is not modified.
sub add_to_attribute {
  my $self = shift;
  my ($name, $value) = $self->_parse_attribute_args(@_);
  return sub {
    my ($evt) = @_;
    my $attrs = $evt->{attrs};
    my $already_present = exists $attrs->{$name};
    my @pieces = $already_present ? ($attrs->{$name}, $value) : ($value);
    # raw and raw_attrs are blanked in the copy - presumably so the
    # serialiser regenerates the tag from attrs rather than reusing stale
    # source text.
    my %updated = (
      %$evt,
      raw       => undef,
      raw_attrs => undef,
      attrs     => { %$attrs, $name => join(' ', @pieces) },
    );
    # Only extend the ordered name list when the attribute is new.
    unless ($already_present) {
      $updated{attr_names} = [ @{$evt->{attr_names}}, $name ];
    }
    return \%updated;
  };
}
72
# Build a filter that removes attribute $name from the event it is given.
#
# $args is either the attribute name itself or a hashref with a 'name' key.
# The returned coderef hands back the very same event when the attribute is
# absent; otherwise it returns a new event hashref without the attribute
# (the original event is not modified).
sub remove_attribute {
  my ($self, $args) = @_;
  my $name = $args;
  $name = $args->{name} if ref($args) eq 'HASH';
  return sub {
    my ($evt) = @_;
    my $attrs = $evt->{attrs};
    return $evt unless exists $attrs->{$name};
    my %remaining = %$attrs;
    delete $remaining{$name};
    my @kept_names = grep { $_ ne $name } @{$evt->{attr_names}};
    return +{
      %$evt,
      raw        => undef,
      raw_attrs  => undef,
      attrs      => \%remaining,
      attr_names => \@kept_names,
    };
  };
}
86
# Build a filter that consumes the events of the selected element from the
# stream, up to and including its matching CLOSE.
#
# Options (hashref):
#   into         - arrayref that receives the collected events
#   passthrough  - also emit every collected event downstream
#   content      - collect only what lies between OPEN and CLOSE; the
#                  closing event is left on the stream
#   filter       - coderef applied to the stream (also available as $_)
#                  before collection starts
#   flush_before - mark the leading event with flush => 1
#
# The returned coderef takes ($evt, $stream) and returns either the
# collector stream alone, or [ $evt, $collector ] when passthrough, content
# or flush_before is set. For an in-place-close element it returns the
# event itself (passthrough/content) or nothing.
sub collect {
  my ($self, $options) = @_;
  my $into         = $options->{into};
  my $passthrough  = $options->{passthrough};
  my $content      = $options->{content};
  my $filter       = $options->{filter};
  my $flush_before = $options->{flush_before};
  return sub {
    my ($evt, $stream) = @_;
    # We wipe the contents of @$into here so that other actions depending
    # on this (such as a repeater) can be invoked multiple times easily.
    # I -suspect- it's better for that state reset to be managed here; if it
    # ever becomes painful the decision should be revisited
    @$into = ($content ? () : ($evt)) if $into;
    if ($evt->{is_in_place_close}) {
      return unless $passthrough || $content;
      return $evt;
    }
    my $tag_name = $evt->{name};
    my $open_count = 1;
    # In content mode we peek first so the final CLOSE is never consumed.
    my $advance = $content ? 'peek' : 'next';
    if ($filter) {
      local $_ = $stream;
      $stream = $filter->($stream);
    }
    my $collector = $self->_stream_from_code(sub {
      # $stream is cleared once the matching CLOSE has been seen.
      return unless $stream;
      while (my ($inner) = $stream->$advance) {
        $open_count++ if $inner->{type} eq 'OPEN';
        $open_count-- if $inner->{type} eq 'CLOSE';
        if (!$open_count) {
          undef $stream;
          return if $content;
          push @$into, $inner if $into;
          return $inner if $passthrough;
          return;
        }
        push @$into, $inner if $into;
        # Actually consume the event we only peeked at above.
        $stream->next if $content;
        return $inner if $passthrough;
      }
      die "Never saw closing </${tag_name}> before end of source";
    });
    my $keeps_event = $passthrough || $content;
    if ($flush_before) {
      $evt = $keeps_event
        ? +{ %$evt, flush => 1 }
        : +{ type => 'EMPTY', flush => 1 };
    }
    return $collector unless $keeps_event || $flush_before;
    return [ $evt, $collector ];
  };
}
138
# Same as collect, but with the 'content' option forced on. The caller's
# options hash (if any) is copied, not modified.
sub collect_content {
  my ($self, $options) = @_;
  my %merged = $options ? %$options : ();
  $merged{content} = 1;
  return $self->collect(\%merged);
}
143
# Build a filter that emits @$events followed by the event it was given.
sub add_before {
  my ($self, $events) = @_;
  return sub {
    my ($evt) = @_;
    my @sequence = (@$events, $evt);
    return $self->_stream_from_array(@sequence);
  };
}
148
# Build a filter that lets the selected element pass through untouched and
# emits @$events once it has ended.
sub add_after {
  my ($self, $events) = @_;
  my $collect = $self->collect({ passthrough => 1 });
  return sub {
    my $trailing = $self->_stream_from_array(@$events);
    # Hand our own ($evt, $stream) arguments straight to the collector.
    my $collected = $collect->(@_);
    # A plain hashref means a single event came back and nothing was
    # collected, so the extra events follow it directly.
    if (ref($collected) eq 'HASH') {
      return [ $collected, $trailing ];
    }
    my ($first, $rest) = @$collected;
    return [ $first, $self->_stream_concat($rest, $trailing) ];
  };
}
456a815d 161
# Build a filter that emits @$events immediately after the opening event
# of the selected element.
#
# An in-place-close element is expanded: a copy of the event without its
# raw/is_in_place_close keys is returned together with a stream of
# @$events followed by a synthesised CLOSE event for the same name.
sub prepend_content {
  my ($self, $events) = @_;
  return sub {
    my ($evt) = @_;
    return $self->_stream_from_array($evt, @$events)
      unless $evt->{is_in_place_close};
    my %opened = %$evt;
    delete @opened{qw(raw is_in_place_close)};
    my $close = { type => 'CLOSE', name => $opened{name} };
    return [ \%opened, $self->_stream_from_array(@$events, $close) ];
  };
}
175
# Build a filter that emits @$events after the existing content of the
# selected element.
#
# An in-place-close element is expanded: a copy of the event without its
# raw/is_in_place_close keys is returned together with a stream of
# @$events followed by a synthesised CLOSE event for the same name.
sub append_content {
  my ($self, $events) = @_;
  my $collect = $self->collect({ passthrough => 1, content => 1 });
  return sub {
    my ($evt) = @_;
    if ($evt->{is_in_place_close}) {
      my %opened = %$evt;
      delete @opened{qw(raw is_in_place_close)};
      my $close = { type => 'CLOSE', name => $opened{name} };
      return [ \%opened, $self->_stream_from_array(@$events, $close) ];
    }
    # Hand our own ($evt, $stream) arguments straight to the collector,
    # then chain the new events behind the collected content.
    my ($first, $content_stream) = @{ $collect->(@_) };
    my $extra = $self->_stream_from_array(@$events);
    return [ $first, $self->_stream_concat($content_stream, $extra) ];
  };
}
192
# Build a filter that replaces the selected element (or, with the
# 'content' option, only its content) with $replace_with.
#
# $replace_with is turned into a stream via _stream_from_proto each time
# the filter runs; $options is handed to collect unchanged.
sub replace {
  my ($self, $replace_with, $options) = @_;
  my $collect = $self->collect($options);
  return sub {
    my (undef, $stream) = @_;
    my $emit = $self->_stream_from_proto($replace_with);
    # Hand our own ($evt, $stream) arguments straight to the collector.
    my $collected = $collect->(@_);
    # if we're replacing the contents of an in place close
    # then we need to handle that here
    if ($options->{content}
        and ref($collected) eq 'HASH'
        and $collected->{is_in_place_close}) {
      my $close = $stream->next;
      # shallow copy and nuke in place and raw (to force smart print);
      # the loop variable aliases $collected and $close, so assigning to
      # it rebinds those two variables to the copies
      for my $event ($collected, $close) {
        $event = { %$event };
        delete @{$event}{qw(is_in_place_close raw)};
      }
      my $close_stream = $self->_stream_from_array($close);
      $emit = $self->_stream_concat($emit, $close_stream);
    }
    # For a straightforward replace operation we can, in fact, do the emit
    # -before- the collect, and my first cut did so. However in order to
    # use the captured content in generating the new content, we need
    # the collect stage to happen first - and it seems highly unlikely
    # that in normal operation the collect phase will take long enough
    # for the difference to be noticeable
    return $emit unless $collected;
    my $shape = ref($collected);
    if ($shape eq 'ARRAY') {    # [ event, stream ]
      my ($first, $rest) = @$collected;
      return [ $first, $self->_stream_concat($rest, $emit) ];
    }
    if ($shape eq 'HASH') {     # a single event
      return [ $collected, $emit ];
    }
    # anything else is treated as a stream
    return $self->_stream_concat($collected, $emit);
  };
}
232
# Same as replace, but with the 'content' option forced on. The caller's
# options hash (if any) is copied, not modified.
sub replace_content {
  my ($self, $replace_with, $options) = @_;
  my %merged = $options ? %$options : ();
  $merged{content} = 1;
  return $self->replace($replace_with, \%merged);
}
237
# Build a filter that replaces the selected element with one rendition of
# it per item produced by $repeat_for.
#
# $repeat_for is turned into a stream via _stream_from_proto; each item is
# called as a coderef with a fresh stream of the collected events (also
# available as $_) and its result becomes one repetition.
#
# Options (hashref, all optional) are passed on to replace, except:
#   repeat_between - selector; the matching events inside the element are
#                    collected separately and re-emitted between
#                    consecutive repetitions
# The 'into' option (and 'filter', when repeat_between is given) is always
# overridden here. The caller's hash is copied first, so it is never
# modified and can safely be reused for further calls.
sub repeat {
  my ($self, $repeat_for, $options) = @_;
  my %opts = %{ $options || {} };
  $opts{into} = \my @into;
  my @between;
  my $repeat_between = delete $opts{repeat_between};
  if ($repeat_between) {
    $opts{filter} = sub {
      $_->select($repeat_between)->collect({ into => \@between })
    };
  }
  my $repeater = sub {
    my $s = $self->_stream_from_proto($repeat_for);
    # We have to test $repeat_between not @between here because
    # at the point we're constructing our return stream @between
    # hasn't been populated yet - but we can test @between in the
    # map routine because it has been by then and that saves us doing
    # the extra stream construction if we don't need it.
    $self->_flatten_stream_of_streams(do {
      if ($repeat_between) {
        $s->map(sub {
          local $_ = $self->_stream_from_array(@into);
          # only add the separator when another repetition follows
          (@between && $s->peek)
            ? $self->_stream_concat(
                $_[0]->($_), $self->_stream_from_array(@between)
              )
            : $_[0]->($_)
        })
      } else {
        $s->map(sub {
          local $_ = $self->_stream_from_array(@into);
          $_[0]->($_)
        })
      }
    })
  };
  $self->replace($repeater, \%opts);
}
275
# Same as repeat, but with the 'content' option forced on. The caller's
# options hash (if any) is copied, not modified.
sub repeat_content {
  my ($self, $repeat_for, $options) = @_;
  my %merged = $options ? %$options : ();
  $merged{content} = 1;
  return $self->repeat($repeat_for, \%merged);
}
280
456a815d 2811;
556c8616 282
283=head1 NAME
284
285HTML::Zoom::FilterBuilder - Add Filters to a Stream
286
244252e7 287=head1 SYNOPSIS
288
0d8f057e 289 use HTML::Zoom;
290 my $root = HTML::Zoom
291 ->from_html(<<MAIN);
292 <html>
293 <head>
294 <title>Default Title</title>
295 </head>
296 <body>
297 Default Content
298 </body>
299 </html>
300 MAIN
301
302 my $body = HTML::Zoom
303 ->from_html(<<BODY);
304 <div id="stuff">
2daa653a 305 <p>Well Now</p>
306 <p>Is the Time</p>
0d8f057e 307 </div>
308 BODY
309
310 my $output = $root
311 ->select('title')
312 ->replace_content('Hello World')
313 ->select('body')
314 ->replace_content($body)
2daa653a 315 ->select('#stuff p')
316 ->add_to_attribute(class=>'body')
0d8f057e 317 ->to_html;
318
319will produce:
320
321=begin testinfo
322
323 my $expect = <<HTML;
324
325=end testinfo
326
327 <html>
328 <head>
329 <title>Hello World</title>
330 </head>
331 <body><div id="stuff">
 <p class="body">Well Now</p>
 <p class="body">Is the Time</p>
333 </div>
334 </body>
335 </html>
336
337=begin testinfo
338
339 HTML
340 is($output, $expect, 'Synopsis code works ok');
341
342=end testinfo
244252e7 343
556c8616 344=head1 DESCRIPTION
345
346Given a L<HTML::Zoom> stream, provide methods to apply filters which
347alter the content of that stream.
348
f6644c71 349=head1 METHODS
350
351This class defines the following public API
352
353=head2 set_attribute
354
355 TBD
356
2daa653a 357=head2 add_to_attribute
f6644c71 358
359 TBD
360
361=head2 remove_attribute
362
363 TBD
364
365=head2 collect
366
367 TBD
368
369=head2 collect_content
370
371 TBD
372
373=head2 add_before
374
375 TBD
376
377=head2 add_after
378
379 TBD
380
381=head2 prepend_content
382
383 TBD
384
385=head2 append_content
386
387 TBD
388
389=head2 replace
390
391 TBD
392
393=head2 replace_content
394
244252e7 395Given a L<HTML::Zoom/select> result, replace the content with a string, array
396or another L<HTML::Zoom> object.
f6644c71 397
398=head2 repeat
399
400 TBD
401
402=head2 repeat_content
403
404 TBD
405
=head1 SEE ALSO
407
408L<HTML::Zoom>
409
410=head1 AUTHORS
411
412See L<HTML::Zoom> for authors.
413
414=head1 LICENSE
415
416See L<HTML::Zoom> for the license.
417
418=cut
419