Added more tests and rollback/commit are kinda working
[dbsrgits/DBM-Deep.git] / lib / DBM / Deep / Engine3.pm
CommitLineData
696cadb7 1package DBM::Deep::Engine3;
2
3use 5.6.0;
4
5use strict;
6
7our $VERSION = q(0.99_03);
8
696cadb7 9use Scalar::Util ();
10
# File-wide notes:
# * Every method in here assumes that the storage has been appropriately
#   safeguarded. This can be anything from flock() to some sort of manual
#   mutex. But, it's the caller's responsibility to make sure that this has
#   been done.
16
# File and tag signatures. These are written into the file itself, so they
# should never change.
sub SIG_FILE     () { 'DPDB' }   # Leading signature of the file header
sub SIG_HEADER   () { 'h'    }   # Follows SIG_FILE in the file header
sub SIG_INTERNAL () { 'i'    }
sub SIG_HASH     () { 'H'    }   # Reference sector holding a hash
sub SIG_ARRAY    () { 'A'    }   # Reference sector holding an array
sub SIG_NULL     () { 'N'    }   # Null (undef) data sector
sub SIG_DATA     () { 'D'    }   # Scalar data sector
sub SIG_INDEX    () { 'I'    }
sub SIG_BLIST    () { 'B'    }   # Bucket list sector
sub SIG_FREE     () { 'F'    }   # Sector that has been freed
sub SIG_KEYS     () { 'K'    }
sub SIG_SIZE     () { 1      }   # presumably the signature length in bytes
30
696cadb7 31################################################################################
32
# Maps a field width in bytes to the pack()/unpack() template used to store
# a value of that width. Please refer to the pack() documentation for further
# information on each template.
my %StP = (
    1 => 'C',   # Unsigned char value
    2 => 'n',   # Unsigned short in "network" (big-endian) order
    4 => 'N',   # Unsigned long in "network" (big-endian) order
    8 => 'Q',   # Unsigned quad (no order specified, presumably machine-dependent)
);
40
# Constructor for the storage engine.
#
# Takes an optional hashref of settings. Any key matching one of the defaults
# listed below (byte_size, digest, hash_size, max_buckets, num_txns, trans_id,
# entries, storage) overrides that default. 'pack_size' may be given as
# 'small', 'medium' or 'large' (case-insensitive) as a symbolic way of
# selecting a byte_size of 2, 4 or 8.
#
# Dies on an unknown pack_size, or on a byte_size for which there is no
# pack() template. Returns the new engine object.
sub new {
    my $class = shift;
    my ($args) = @_;

    # Work on a shallow copy so that translating pack_size into byte_size
    # never modifies the hashref the caller handed us.
    my %opts = %{ $args || {} };

    my $self = bless {
        byte_size   => 4,

        digest      => undef,
        hash_size   => 16,    # In bytes
        max_buckets => 16,
        num_txns    => 16,    # HEAD plus 15 running txns
        trans_id    => 0,     # Default to the HEAD

        entries     => {},    # This is the list of entries for transactions
        storage     => undef,
    }, $class;

    if ( defined $opts{pack_size} ) {
        my %byte_size_for = ( small => 2, medium => 4, large => 8 );
        my $wanted = $byte_size_for{ lc $opts{pack_size} };
        die "Unknown pack_size value: '$opts{pack_size}'\n"
            unless defined $wanted;
        $opts{byte_size} = $wanted;
    }

    # Grab the parameters we want to use
    foreach my $param ( keys %$self ) {
        next unless exists $opts{$param};
        $self->{$param} = $opts{$param};
    }

    # Every offset in the file is packed with this template, so refuse a
    # width we have no template for instead of failing later inside pack().
    my $byte_size = $self->byte_size;
    unless ( defined $byte_size && exists $StP{$byte_size} ) {
        my $shown = defined $byte_size ? $byte_size : 'undef';
        die "Unknown byte_size value: '$shown'\n";
    }
    $self->{byte_pack} = $StP{$byte_size};

    ##
    # Number of buckets per blist before another level of indexing is
    # done. Increase this value for slightly greater speed, but larger database
    # files. DO NOT decrease this value below 16, due to risk of recursive
    # reindex overrun.
    ##
    if ( $self->{max_buckets} < 16 ) {
        warn "Floor of max_buckets is 16. Setting it to 16 from '$self->{max_buckets}'\n";
        $self->{max_buckets} = 16;
    }

    # Default to MD5 when the caller did not supply a digest function.
    if ( !$self->{digest} ) {
        require Digest::MD5;
        $self->{digest} = \&Digest::MD5::md5;
    }

    return $self;
}
100
101################################################################################
102
# Returns the data stored under $key in the structure rooted at $obj.
#
# When nothing is stored under the key, a Null sector is created and written
# under it, and that sector's data is returned instead.
# Dies if the sector at $obj's base offset cannot be loaded.
sub read_value {
    my ($self, $obj, $key) = @_;

    # This will be a Reference sector
    my $ref_sector = $self->_load_sector( $obj->_base_offset );
    unless ( $ref_sector ) {
        die "How did read_value fail (no sector for '$obj')?!\n";
    }

    my $digest = $self->_apply_digest( $key );

    my $found = $ref_sector->get_data_for({
        key_md5    => $digest,
        allow_head => 1,
    });
    return $found->data if $found;

    # Nothing there yet: store a Null sector under this key and hand back
    # whatever that sector reports as its data.
    my $null_sector = DBM::Deep::Engine::Sector::Null->new({
        engine => $self,
        data   => undef,
    });

    $ref_sector->write_data({
        key_md5 => $digest,
        key     => $key,
        value   => $null_sector,
    });

    return $null_sector->data;
}
133
# Returns the class name recorded in the Reference sector that $obj points at
# (whatever that sector's get_classname reports).
# Dies if the sector at $obj's base offset cannot be loaded.
sub get_classname {
    my $self = shift;
    my ($obj) = @_;

    # This will be a Reference sector
    my $sector = $self->_load_sector( $obj->_base_offset )
        or die "How did get_classname fail (no sector for '$obj')?!\n";

    return $sector->get_classname;
}
144
# Reports whether $key has data in the structure rooted at $obj.
# Returns 1 when it does and '' when it does not, mirroring exists().
# Dies if the sector at $obj's base offset cannot be loaded.
sub key_exists {
    my ($self, $obj, $key) = @_;

    # This will be a Reference sector
    my $ref_sector = $self->_load_sector( $obj->_base_offset );
    unless ( $ref_sector ) {
        die "How did key_exists fail (no sector for '$obj')?!\n";
    }

    my %lookup = (
        key_md5    => $self->_apply_digest( $key ),
        allow_head => 1,
    );
    my $found = $ref_sector->get_data_for( \%lookup );

    # exists() returns 1 or '' for true/false.
    return '' unless $found;
    return 1;
}
161
# Deletes $key from the structure rooted at $obj and returns whatever the
# Reference sector's delete_key returns.
# Dies if the sector at $obj's base offset cannot be loaded.
sub delete_key {
    my $self = shift;
    my ($obj, $key) = @_;

    my $sector = $self->_load_sector( $obj->_base_offset )
        or die "How did delete_key fail (no sector for '$obj')?!\n";

    # The Reference sector's delete_key reads $args->{key} when it preserves
    # the old value for other running transactions, so hand the key over as
    # well as its digest.
    return $sector->delete_key({
        key        => $key,
        key_md5    => $self->_apply_digest( $key ),
        allow_head => 0,
    });
}
174
# Stores $value under $key in the structure rooted at $obj.
#
# undef is stored as a Null sector, plain scalars as a Scalar sector and
# array/hash references as a Reference sector. Any other reference type, or
# a tied array/hash, is rejected through DBM::Deep->_throw_error.
# After an array or hash has been stored it is tied to DBM::Deep and refilled
# from a copy of its contents. Returns 1.
sub write_value {
    my ($self, $obj, $key, $value) = @_;

    my $reftype = Scalar::Util::reftype( $value ) || '';
    unless ( $reftype eq '' || $reftype eq 'HASH' || $reftype eq 'ARRAY' ) {
        DBM::Deep->_throw_error(
            "Storage of references of type '$reftype' is not supported."
        );
    }

    my $is_array = $reftype eq 'ARRAY';
    my $is_hash  = $reftype eq 'HASH';

    my ($class, $type);
    if ( !defined $value ) {
        $class = 'DBM::Deep::Engine::Sector::Null';
    }
    elsif ( $is_array || $is_hash ) {
        if ( ( $is_array && tied(@$value) ) || ( $is_hash && tied(%$value) ) ) {
            DBM::Deep->_throw_error( "Cannot store something that is tied." );
        }
        $class = 'DBM::Deep::Engine::Sector::Reference';
        $type  = substr( $reftype, 0, 1 );
    }
    else {
        $class = 'DBM::Deep::Engine::Sector::Scalar';
    }

    # This will be a Reference sector
    my $ref_sector = $self->_load_sector( $obj->_base_offset );
    unless ( $ref_sector ) {
        die "How did write_value fail (no sector for '$obj')?!\n";
    }

    # Create this after loading the reference sector in case something bad happens.
    # This way, we won't allocate value sector(s) needlessly.
    my $value_sector = $class->new({
        engine => $self,
        data   => $value,
        type   => $type,
    });

    $ref_sector->write_data({
        key     => $key,
        key_md5 => $self->_apply_digest( $key ),
        value   => $value_sector,
    });

    # This code is to make sure we write all the values in the $value to the disk
    # and to make sure all changes to $value after the assignment are reflected
    # on disk. This may be counter-intuitive at first, but it is correct dwimmery.
    #   NOTE - simply tying $value won't perform a STORE on each value. Hence, the
    #   copy to a temp value.
    if ( $is_array ) {
        my @contents = @$value;
        tie @$value, 'DBM::Deep', {
            base_offset => $value_sector->offset,
            storage     => $self->storage,
            engine      => $self,
        };
        @$value = @contents;
        unless ( Scalar::Util::blessed( $value ) ) {
            bless $value, 'DBM::Deep::Array';
        }
    }
    elsif ( $is_hash ) {
        my %contents = %$value;
        tie %$value, 'DBM::Deep', {
            base_offset => $value_sector->offset,
            storage     => $self->storage,
            engine      => $self,
        };
        %$value = %contents;
        unless ( Scalar::Util::blessed( $value ) ) {
            bless $value, 'DBM::Deep::Hash';
        }
    }

    return 1;
}
255
# Returns the key following $prev_key in the structure rooted at $obj.
#
# When $prev_key is undefined a fresh iterator is created and stored in
# $obj->{iterator}, i.e. iteration starts over. The check is on definedness,
# not truth, so that a previous key of '0' or '' continues the iteration
# instead of restarting it.
sub get_next_key {
    my $self = shift;
    my ($obj, $prev_key) = @_;

    # XXX Need to add logic about resetting the iterator if any key in the reference has changed
    unless ( defined $prev_key ) {
        $obj->{iterator} = DBM::Deep::Engine::Iterator->new({
            base_offset => $obj->_base_offset,
            engine      => $self,
        });
    }

    return $obj->{iterator}->get_next_key;
}
270
271################################################################################
272
# Makes sure $obj knows its base offset, reading or creating the file header
# as needed. Does nothing when $obj already has a base offset. Returns 1.
#
# For a new file (no header could be read) the header is written and an
# initial Reference sector of $obj's type is created. For an existing file
# the Reference sector following the header is loaded and its type compared
# with $obj's type; a mismatch is reported through DBM::Deep->_throw_error.
sub setup_fh {
    my ($self, $obj) = @_;

    # We're only opening the file if the object has no base offset yet.
    return 1 if $obj->_base_offset;

    my $bytes_read = $self->_read_file_header;

    if ( $bytes_read ) {
        # Reading from an existing file
        $obj->{base_offset} = $bytes_read;

        my $root = DBM::Deep::Engine::Sector::Reference->new({
            engine => $self,
            offset => $obj->_base_offset,
        });
        if ( !$root ) {
            DBM::Deep->_throw_error("Corrupted file, no master index record");
        }

        if ( $obj->_type ne $root->type ) {
            DBM::Deep->_throw_error("File type mismatch");
        }
    }
    else {
        # Creating a new file
        $self->_write_file_header;

        # 1) Create Array/Hash entry
        my $root = DBM::Deep::Engine::Sector::Reference->new({
            engine => $self,
            type   => $obj->_type,
        });
        $obj->{base_offset} = $root->offset;

        $self->storage->flush;
    }

    return 1;
}
313
# Starts a transaction by claiming the first free transaction slot and making
# its index the engine's current trans_id.
#
# Throws (via DBM::Deep->_throw_error) when a transaction is already running
# or when no slot is free. $obj is accepted for interface compatibility and
# is not used.
sub begin_work {
    my $self = shift;
    my ($obj) = @_;

    if ( $self->trans_id ) {
        DBM::Deep->_throw_error( "Cannot begin_work within a transaction" );
    }

    my @slots = $self->read_transaction_slots;

    # Slot 0 is the HEAD. Usable ids are 1 .. num_txns - 1: each bucket only
    # has num_txns location slots, so a larger id would address the next
    # bucket. Never look past the end of the slot list either.
    my $last_id = $self->num_txns - 1;
    $last_id = $#slots if $last_id > $#slots;

    for my $i ( 1 .. $last_id ) {
        next if $slots[$i];
        $slots[$i] = 1;
        $self->set_trans_id( $i );
        last;
    }
    $self->write_transaction_slots( @slots );

    if ( !$self->trans_id ) {
        DBM::Deep->_throw_error( "Cannot begin_work - no available transactions" );
    }

    return;
}
696cadb7 337
# Abandons the current transaction.
#
# For every bucket recorded for this transaction, the transaction's location
# slot is zeroed and the sector it pointed at is freed. The recorded entries
# are then cleared, the transaction slot is released and the engine goes back
# to the HEAD (trans_id 0). Returns 1.
#
# Throws (via DBM::Deep->_throw_error) when no transaction is running. $obj is
# accepted for interface compatibility and is not used.
sub rollback {
    my $self = shift;
    my ($obj) = @_;

    if ( !$self->trans_id ) {
        DBM::Deep->_throw_error( "Cannot rollback without a transaction" );
    }

    my $storage   = $self->storage;
    my $byte_size = $self->byte_size;
    my $template  = $StP{$byte_size};

    # Distance from the start of a bucket to this transaction's location
    # slot: the md5, one more location, then one location per transaction id.
    my $slot_offset = $self->hash_size
                    + $byte_size
                    + $self->trans_id * $byte_size;

    # Each entry is the file location for a bucket that has a modification for
    # this transaction. The entries need to be expunged.
    foreach my $entry ( @{ $self->get_entries } ) {
        my $read_loc = $entry + $slot_offset;

        my $data_loc = $storage->read_at( $read_loc, $byte_size );
        $data_loc = unpack( $template, $data_loc );
        $storage->print_at( $read_loc, pack( $template, 0 ) );

        # Values of 0 and 1 are not treated as sector locations (presumably
        # "nothing" and a deleted marker - TODO confirm against mark_deleted).
        if ( $data_loc > 1 ) {
            # _load_sector returns nothing for a sector that is already
            # free, so only free what was actually loaded.
            my $sector = $self->_load_sector( $data_loc );
            $sector->free if $sector;
        }
    }

    $self->clear_entries;

    my @slots = $self->read_transaction_slots;
    $slots[$self->trans_id] = 0;
    $self->write_transaction_slots( @slots );
    $self->set_trans_id( 0 );

    return 1;
}
696cadb7 373
# Commits the current transaction.
#
# For every bucket recorded for this transaction, the transaction's location
# is copied over the HEAD location, the transaction's slot is zeroed and the
# sector the HEAD used to point at is freed. The recorded entries are then
# cleared, the transaction slot is released and the engine goes back to the
# HEAD (trans_id 0). Returns 1.
#
# Throws (via DBM::Deep->_throw_error) when no transaction is running. $obj is
# accepted for interface compatibility and is not used.
sub commit {
    my $self = shift;
    my ($obj) = @_;

    if ( !$self->trans_id ) {
        DBM::Deep->_throw_error( "Cannot commit without a transaction" );
    }

    my $storage    = $self->storage;
    my $byte_size  = $self->byte_size;
    my $template   = $StP{$byte_size};
    my $txn_offset = $self->trans_id * $byte_size;

    foreach my $entry ( @{ $self->get_entries } ) {
        # Overwrite the entry in head with the entry in trans_id
        my $base = $entry
                 + $self->hash_size
                 + $byte_size;

        my $head_loc = $storage->read_at( $base, $byte_size );
        $head_loc = unpack( $template, $head_loc );
        my $trans_loc = $storage->read_at( $base + $txn_offset, $byte_size );

        $storage->print_at( $base, $trans_loc );
        $storage->print_at( $base + $txn_offset, pack( $template, 0 ) );

        # Values of 0 and 1 are not treated as sector locations (presumably
        # "nothing" and a deleted marker - TODO confirm against mark_deleted).
        if ( $head_loc > 1 ) {
            # _load_sector returns nothing for a sector that is already
            # free, so only free what was actually loaded.
            my $old_head = $self->_load_sector( $head_loc );
            $old_head->free if $old_head;
        }
    }

    $self->clear_entries;

    my @slots = $self->read_transaction_slots;
    $slots[$self->trans_id] = 0;
    $self->write_transaction_slots( @slots );
    $self->set_trans_id( 0 );

    return 1;
}
416
# Reads the 4 bytes at trans_loc and returns them as a list of 32 flags
# ('0' or '1'), one per transaction slot, in "b32" bit order.
sub read_transaction_slots {
    my ($self) = @_;
    my $bits = unpack( "b32", $self->storage->read_at( $self->trans_loc, 4 ) );
    return split '', $bits;
}
421
# Packs the given list of slot flags as a "b32" bit string and writes it at
# trans_loc.
sub write_transaction_slots {
    my ($self, @slots) = @_;
    my $packed = pack( "b32", join( '', @slots ) );
    $self->storage->print_at( $self->trans_loc, $packed );
}
696cadb7 428
# Returns an arrayref of the locations recorded for the current transaction.
# The per-transaction hash is created if it does not exist yet.
sub get_entries {
    my ($self) = @_;
    my $for_txn = ( $self->{entries}{$self->trans_id} ||= {} );
    return [ keys %$for_txn ];
}
433
# Records that the bucket at file location $loc has been modified by
# transaction $trans_id. Recording the same location twice is harmless.
sub add_entry {
    my $self = shift;
    my ($trans_id, $loc) = @_;

    # Only the hash keys matter; the value is never looked at.
    $self->{entries}{$trans_id} ||= {};
    $self->{entries}{$trans_id}{$loc} = undef;

    return;
}
443
# Forgets every location recorded for the current transaction.
sub clear_entries {
    my $self = shift;
    delete $self->{entries}{$self->trans_id};
}
449
c9f02899 450################################################################################
b9ec359f 451
{
    # Size in bytes of the fixed part of the header: the file signature, the
    # header signature (1), the header version (4) and the size of the
    # variable part (4).
    my $header_fixed = length( SIG_FILE ) + 1 + 4 + 4;

    # Writes a fresh file header and records where the transaction bitfield
    # and the free-chain heads live (trans_loc / chains_loc).
    # Throws when max_buckets does not fit into the single header byte.
    sub _write_file_header {
        my $self = shift;

        # max_buckets is stored with pack('C'), i.e. in one byte. A larger
        # value would wrap around and be read back wrongly on the next open.
        if ( $self->max_buckets > 255 ) {
            DBM::Deep->_throw_error(
                "max_buckets (" . $self->max_buckets . ") is too large to store in the file header (maximum is 255)"
            );
        }

        # byte_size (1) + max_buckets (1) + transaction bitfield (4)
        # + two free-chain heads of byte_size bytes each.
        my $header_var = 1 + 1 + 4 + 2 * $self->byte_size;

        my $loc = $self->storage->request_space( $header_fixed + $header_var );

        $self->storage->print_at( $loc,
            SIG_FILE,
            SIG_HEADER,
            pack('N', 1),           # header version - at this point, we're at 9 bytes
            pack('N', $header_var), # header size
            # --- Above is $header_fixed. Below is $header_var
            pack('C', $self->byte_size),
            pack('C', $self->max_buckets),
            pack('N', 0 ),                   # Running transactions
            pack($StP{$self->byte_size}, 0), # Start of free chain (blist size)
            pack($StP{$self->byte_size}, 0), # Start of free chain (data size)
        );

        # Both locations are relative to the start of the file; they skip the
        # fixed header plus the byte_size and max_buckets bytes (and, for the
        # chains, the 4-byte transaction bitfield).
        $self->set_trans_loc( $header_fixed + 2 );
        $self->set_chains_loc( $header_fixed + 6 );

        return;
    }

    # Reads and validates the file header.
    # Returns nothing when the file is empty, otherwise the total number of
    # header bytes read. On success byte_size and max_buckets are taken from
    # the file and trans_loc / chains_loc are set.
    # Closes the storage and throws on a bad signature, an old file version,
    # a truncated header or an unexpected header size.
    sub _read_file_header {
        my $self = shift;

        my $buffer = $self->storage->read_at( 0, $header_fixed );
        return unless length($buffer);

        my ($file_signature, $sig_header, $header_version, $size) = unpack(
            'A4 A N N', $buffer
        );

        unless ( $file_signature eq SIG_FILE ) {
            $self->storage->close;
            DBM::Deep->_throw_error( "Signature not found -- file is not a Deep DB" );
        }

        unless ( $sig_header eq SIG_HEADER ) {
            $self->storage->close;
            DBM::Deep->_throw_error( "Old file version found." );
        }

        # An undef offset is used here to read the variable part directly
        # after the fixed part (presumably "continue at the current
        # position" - TODO confirm against the storage class).
        my $buffer2 = $self->storage->read_at( undef, $size );
        my @values = unpack( 'C C', $buffer2 );

        $self->set_trans_loc( $header_fixed + 2 );
        $self->set_chains_loc( $header_fixed + 6 );

        if ( @values < 2 || grep { !defined } @values ) {
            $self->storage->close;
            DBM::Deep->_throw_error("Corrupted file - bad header");
        }

        #XXX Add warnings if values weren't set right
        @{$self}{qw(byte_size max_buckets)} = @values;

        # Both sides are numbers, so compare them numerically.
        my $header_var = 1 + 1 + 4 + 2 * $self->byte_size;
        unless ( $size == $header_var ) {
            $self->storage->close;
            DBM::Deep->_throw_error( "Unexpected size found ($size <-> $header_var)." );
        }

        return length($buffer) + length($buffer2);
    }
}
524
# Loads the sector stored at $offset.
#
# The first byte at $offset is the sector signature and decides which sector
# class is instantiated. Returns nothing when that byte is NUL or SIG_FREE;
# dies on any other unknown signature.
sub _load_sector {
    my ($self, $offset) = @_;

    my $sig = $self->storage->read_at( $offset, 1 );
    return if $sig eq chr(0);

    my $class;
    if ( $sig eq $self->SIG_ARRAY || $sig eq $self->SIG_HASH ) {
        $class = 'DBM::Deep::Engine::Sector::Reference';
    }
    # XXX Don't we need key_md5 here?
    elsif ( $sig eq $self->SIG_BLIST ) {
        $class = 'DBM::Deep::Engine::Sector::BucketList';
    }
    elsif ( $sig eq $self->SIG_NULL ) {
        $class = 'DBM::Deep::Engine::Sector::Null';
    }
    elsif ( $sig eq $self->SIG_DATA ) {
        $class = 'DBM::Deep::Engine::Sector::Scalar';
    }
    # This was deleted from under us, so just return and let the caller figure it out.
    elsif ( $sig eq $self->SIG_FREE ) {
        return;
    }
    else {
        die "'$offset': Don't know what to do with type '$sig'\n";
    }

    return $class->new({
        engine => $self,
        type   => $sig,
        offset => $offset,
    });
}
568
# Runs the configured digest function over the given arguments and returns
# its result.
sub _apply_digest {
    my ($self, @input) = @_;
    my $digest = $self->{digest};
    return $digest->( @input );
}
573
# Puts the sector at $offset (of $size bytes) at the front of the matching
# free chain: the chain head in the file header is pointed at $offset and the
# previous head is stored in the sector right after its signature byte.
sub _add_free_sector {
    my ($self, $offset, $size) = @_;

    # Sectors of 256 bytes (data sectors) use the second chain head; every
    # other size (blist sectors) uses the first.
    my $chains_offset = ( $size == 256 ) ? $self->byte_size : 0;
    my $head_loc      = $self->chains_loc + $chains_offset;

    my $old_head = $self->storage->read_at( $head_loc, $self->byte_size );

    $self->storage->print_at( $head_loc,
        pack( $StP{$self->byte_size}, $offset ),
    );

    # Record the old head in the new sector after the signature
    return $self->storage->print_at( $offset + 1, $old_head );
}
597
# Returns the location of a sector of $size bytes.
#
# The head of the matching free chain is reused when there is one (and the
# chain head is advanced to the next free sector); otherwise new space is
# requested from the storage.
sub _request_sector {
    my ($self, $size) = @_;

    # Sectors of 256 bytes (data sectors) use the second chain head; every
    # other size (blist sectors) uses the first.
    my $chains_offset = ( $size == 256 ) ? $self->byte_size : 0;
    my $head_loc      = $self->chains_loc + $chains_offset;

    my $old_head = $self->storage->read_at( $head_loc, $self->byte_size );
    my $loc = unpack( $StP{$self->byte_size}, $old_head );

    # We don't have any free sectors of the right size, so allocate a new one.
    if ( !$loc ) {
        return $self->storage->request_space( $size );
    }

    # The freed sector keeps the next chain entry right after its signature.
    my $new_head = $self->storage->read_at( $loc + 1, $self->byte_size );
    $self->storage->print_at( $head_loc, $new_head );

    return $loc;
}
625
696cadb7 626################################################################################
627
# Read-only accessors for the engine's settings.
sub storage     { return $_[0]->{storage} }
sub byte_size   { return $_[0]->{byte_size} }
sub hash_size   { return $_[0]->{hash_size} }
sub num_txns    { return $_[0]->{num_txns} }
sub max_buckets { return $_[0]->{max_buckets} }

# A string of hash_size NUL bytes.
sub blank_md5   { return chr(0) x $_[0]->hash_size }

# Id of the transaction the engine is currently working in (0 is the HEAD).
sub trans_id     { return $_[0]->{trans_id} }
sub set_trans_id { return $_[0]->{trans_id} = $_[1] }

# File location of the transaction slot bitfield.
sub trans_loc     { return $_[0]->{trans_loc} }
sub set_trans_loc { return $_[0]->{trans_loc} = $_[1] }

# File location of the free-chain heads.
sub chains_loc     { return $_[0]->{chains_loc} }
sub set_chains_loc { return $_[0]->{chains_loc} = $_[1] }
643
8fbac729 644################################################################################
645
package DBM::Deep::Engine::Iterator;

# Hands out, one call at a time, the keys stored in the bucket list of the
# Reference sector found at base_offset.

# Creates an iterator from a hashref with 'engine' and 'base_offset'.
# The engine reference is weakened.
sub new {
    my ($class, $args) = @_;

    my %fields = (
        breadcrumbs => [],
        engine      => $args->{engine},
        base_offset => $args->{base_offset},
    );
    my $self = bless \%fields, $class;

    Scalar::Util::weaken( $self->{engine} );

    return $self;
}

# Forgets the current position so that the next call starts over.
sub reset {
    my ($self) = @_;
    $self->{breadcrumbs} = [];
}

# Returns the next key, or nothing once the buckets are exhausted (in which
# case the iterator has been reset).
sub get_next_key {
    my ($self) = @_;

    my $trail = $self->{breadcrumbs};

    if ( !@$trail ) {
        # This will be a Reference sector
        my $ref_sector = $self->{engine}->_load_sector( $self->{base_offset} );

        # If no sector is found, this must have been deleted from under us.
        return unless $ref_sector;

        push @$trail, [ $ref_sector->get_blist_loc, 0 ];
    }

    my $found_key;
    while ( 1 ) {
        # Each crumb is a [ blist offset, next bucket index ] pair.
        my $crumb = $trail->[-1];
        my ($offset, $idx) = @$crumb;

        if ( !$offset || $idx >= $self->{engine}->max_buckets ) {
            $self->reset;
            last;
        }

        my $blist = $self->{engine}->_load_sector( $offset )
            or die "Iterator: How did this fail (no blist sector for '$offset')?!\n";

        #XXX Think this through!
        my $loc = $blist->get_data_location_for({
            idx => $idx,
        });
        if ( !$loc ) {
            # Nothing at this index for us; move on to the next bucket.
            $crumb->[1]++;
            next;
        }

        my $key_sector = $blist->get_key_for( $idx );
        if ( !$key_sector ) {
            $self->reset;
            last;
        }

        $crumb->[1]++;
        $found_key = $key_sector->data;
        last;
    }

    return $found_key;
}
720
package DBM::Deep::Engine::Sector;

# Base class for everything stored in the file as a sector.

# Blesses the given hashref itself (no copy is made), weakens its engine
# reference and lets the subclass initialise it through _init.
sub new {
    my ($class, $args) = @_;

    my $self = bless $args, $class;
    Scalar::Util::weaken( $self->{engine} );
    $self->_init;

    return $self;
}

# Hook for subclasses; does nothing by default.
sub _init {}

sub clone { die "Must be implemented in the child class" }

sub engine { return $_[0]->{engine} }
sub offset { return $_[0]->{offset} }
sub type   { return $_[0]->{type} }

# Overwrites the sector with SIG_FREE followed by NUL bytes and hands it to
# the engine's free chain.
sub free {
    my ($self) = @_;

    my $engine = $self->engine;

    $engine->storage->print_at( $self->offset,
        $engine->SIG_FREE,
        chr(0) x ($self->size - 1),
    );

    $engine->_add_free_sector(
        $self->offset, $self->size,
    );

    return;
}
3976d8c9 750
package DBM::Deep::Engine::Sector::Data;

our @ISA = qw( DBM::Deep::Engine::Sector );

# Size of a data sector. This is in bytes.
sub size { return 256 }

# Creates a new sector of the same class carrying the same engine, data and
# type as this one.
sub clone {
    my $self = shift;

    # data() may return an empty list (a bare 'return' does so in list
    # context), which would shift the remaining key/value pairs. Force scalar
    # context so that every key keeps its own value.
    return ref($self)->new({
        engine => $self->engine,
        data   => scalar $self->data,
        type   => $self->type,
    });
}
766
package DBM::Deep::Engine::Sector::Scalar;

our @ISA = qw( DBM::Deep::Engine::Sector::Data );

# Frees this sector and then the sector it chains to, if any.
sub free {
    my ($self) = @_;

    # Read the chain location first: freeing overwrites the sector.
    my $next_loc = $self->chain_loc;

    $self->SUPER::free();

    if ( $next_loc ) {
        $self->engine->_load_sector( $next_loc )->free;
    }

    return;
}

sub type { return $_[0]{engine}->SIG_DATA }

# For a sector without an offset, allocates as many chained sectors as are
# needed and writes the 'data' value into them. Does nothing for a sector
# that already has an offset.
sub _init {
    my ($self) = @_;

    my $engine = $self->engine;

    unless ( $self->offset ) {
        # Payload bytes per sector: everything but the signature, the
        # recycled counter, the data length byte and the chain location.
        my $capacity = $self->size - 3 - 1 * $engine->byte_size;

        $self->{offset} = $engine->_request_sector( $self->size );

        my $payload   = delete $self->{data};
        my $remaining = length $payload;
        my $write_at  = $self->offset;
        my $more      = 1;

        while ( $more ) {
            my $next_offset = 0;
            my ($padding, $chunk_len, $chunk);

            if ( $remaining > $capacity ) {
                # Fill this sector completely and chain to a new one.
                $padding   = 0;
                $chunk_len = $capacity;
                $chunk     = substr( $payload, 0, $chunk_len );

                $remaining  -= $capacity;
                $next_offset = $engine->_request_sector( $self->size );
                $payload     = substr( $payload, $chunk_len );
            }
            else {
                # Everything left fits; this is the last sector.
                $padding   = $capacity - $remaining;
                $chunk_len = $remaining;
                $chunk     = $payload;

                $more = 0;
            }

            $engine->storage->print_at( $write_at,
                $self->type,                                    # Sector type
                pack( $StP{1}, 0 ),                             # Recycled counter
                pack( $StP{$engine->byte_size}, $next_offset ), # Chain loc
                pack( $StP{1}, $chunk_len ),                    # Data length
                $chunk,                                         # Data to be stored in this sector
                chr(0) x $padding,                              # Zero-fill the rest
            );

            $write_at = $next_offset;
        }

        return;
    }
}

# Number of payload bytes stored in this sector.
sub data_length {
    my ($self) = @_;

    my $raw = $self->engine->storage->read_at(
        $self->offset + 2 + $self->engine->byte_size, 1
    );

    return unpack( $StP{1}, $raw );
}

# Location of the next sector in the chain (0 when this is the last one).
sub chain_loc {
    my ($self) = @_;

    my $raw = $self->engine->storage->read_at(
        $self->offset + 2, $self->engine->byte_size,
    );

    return unpack( $StP{$self->engine->byte_size}, $raw );
}

# Returns the stored value, concatenated from this sector and every sector
# chained to it.
sub data {
    my ($self) = @_;

    my $content;
    my $sector = $self;
    while ( 1 ) {
        my $next_loc = $sector->chain_loc;

        $content .= $sector->engine->storage->read_at(
            $sector->offset + 2 + $sector->engine->byte_size + 1, $sector->data_length,
        );

        last unless $next_loc;

        $sector = $sector->engine->_load_sector( $next_loc );
    }

    return $content;
}
874
package DBM::Deep::Engine::Sector::Null;

our @ISA = qw( DBM::Deep::Engine::Sector::Data );

sub type        { return $_[0]{engine}->SIG_NULL }
sub data_length { return 0 }
sub data        { return }

# For a sector without an offset, allocates a sector and writes an empty
# (zero length, zero-filled) record into it. Does nothing for a sector that
# already has an offset.
sub _init {
    my ($self) = @_;

    my $engine = $self->engine;

    unless ( $self->offset ) {
        # Everything but the signature, the recycled counter, the data
        # length byte and the chain location gets zero-filled.
        my $padding = $self->size - 3 - 1 * $engine->byte_size;

        $self->{offset} = $engine->_request_sector( $self->size );
        $engine->storage->print_at( $self->offset,
            $self->type,                          # Sector type
            pack( $StP{1}, 0 ),                   # Recycled counter
            pack( $StP{$engine->byte_size}, 0 ),  # Chain loc
            pack( $StP{1}, $self->data_length ),  # Data length
            chr(0) x $padding,                    # Zero-fill the rest
        );

        return;
    }
}
903
3976d8c9 904package DBM::Deep::Engine::Sector::Reference;
8fbac729 905
3976d8c9 906our @ISA = qw( DBM::Deep::Engine::Sector::Data );
907
# Initialises a Reference sector.
#
# With an offset, only the sector type is read from the file. Without one, a
# new sector is allocated and written; when the 'data' value is a blessed
# reference its class name is stored in a Scalar sector of its own and linked
# from the new sector.
sub _init {
    my ($self) = @_;

    my $engine = $self->engine;

    if ( $self->offset ) {
        $self->{type} = $engine->storage->read_at( $self->offset, 1 );
        return;
    }

    my $classname = Scalar::Util::blessed( delete $self->{data} );
    my $padding   = $self->size - 4 - 2 * $engine->byte_size;

    my $class_offset = 0;
    if ( defined $classname ) {
        my $class_sector = DBM::Deep::Engine::Sector::Scalar->new({
            engine => $self->engine,
            data   => $classname,
        });
        $class_offset = $class_sector->offset;
    }

    $self->{offset} = $engine->_request_sector( $self->size );
    $engine->storage->print_at( $self->offset,
        $self->type,                                     # Sector type
        pack( $StP{1}, 0 ),                              # Recycled counter
        pack( $StP{$engine->byte_size}, 0 ),             # Index/BList loc
        pack( $StP{$engine->byte_size}, $class_offset ), # Classname loc
        chr(0) x $padding,                               # Zero-fill the rest
    );

    return;
}
942
# Returns the sector holding the data for $args->{key_md5}, or nothing when
# the key is not found or has no data location.
#
# 'allow_head' and 'create' both default to 0; the defaults are stored in the
# hashref that was passed in.
sub get_data_for {
    my ($self, $args) = @_;

    # Assume that the head is not allowed and that we don't create a new
    # blist location, unless otherwise specified.
    for my $flag (qw( allow_head create )) {
        $args->{$flag} = 0 unless exists $args->{$flag};
    }

    my $blist = $self->get_bucket_list({
        key_md5 => $args->{key_md5},
        create  => $args->{create},
    });
    return unless $blist && $blist->{found};

    # At this point, $blist knows where the md5 is. What it -doesn't- know yet
    # is whether or not this transaction has this key. That's part of the next
    # function call.
    my $location = $blist->get_data_location_for({
        allow_head => $args->{allow_head},
    });
    return unless $location;

    return $self->engine->_load_sector( $location );
}
968
# Stores $args->{value} under $args->{key} / $args->{key_md5} for the current
# transaction, creating the bucket list if necessary.
#
# When the write happens in the HEAD while other transactions are running,
# those transactions are shielded from it first: for an existing key they
# receive a clone of the old value, for a new key the key is marked as
# deleted for them. A transaction that already has its own location for the
# key is left alone.
# Dies if no bucket list can be obtained.
sub write_data {
    my $self = shift;
    my ($args) = @_;

    my $blist = $self->get_bucket_list({
        key_md5 => $args->{key_md5},
        create  => 1,
    }) or die "How did write_data fail (no blist)?!\n";

    # Handle any transactional bookkeeping.
    if ( $self->engine->trans_id ) {
        # A key created inside a transaction is marked as deleted in the HEAD.
        if ( ! $blist->{found} ) {
            $blist->mark_deleted({
                trans_id => 0,
            });
        }
    }
    else {
        my @transactions = $self->engine->read_transaction_slots;
        my @trans_ids = grep { $transactions[$_] } 0 .. $#transactions;
        if ( $blist->{found} ) {
            if ( @trans_ids ) {
                my $old_value = $blist->get_data_for;
                foreach my $other_trans_id ( @trans_ids ) {
                    next if $blist->get_data_location_for({ trans_id => $other_trans_id, allow_head => 0 });
                    $blist->write_md5({
                        trans_id => $other_trans_id,
                        key      => $args->{key},
                        key_md5  => $args->{key_md5},
                        value    => $old_value->clone,
                    });
                }
            }
        }
        else {
            if ( @trans_ids ) {
                foreach my $other_trans_id ( @trans_ids ) {
                    next if $blist->get_data_location_for({ trans_id => $other_trans_id, allow_head => 0 });
                    $blist->mark_deleted({
                        trans_id => $other_trans_id,
                    });
                }
            }
        }
    }

    #XXX Is this safe to do transactionally?
    # Free the place we're about to write to.
    if ( $blist->get_data_location_for({ allow_head => 0 }) ) {
        $blist->get_data_for({ allow_head => 0 })->free;
    }

    $blist->write_md5({
        key     => $args->{key},
        key_md5 => $args->{key_md5},
        value   => $args->{value},
    });
}
1028
# Deletes the key identified by $args->{key_md5} for the current transaction
# and returns the data that was stored under it (nothing when the current
# transaction had no value for the key).
#
# When the delete happens in the HEAD while other transactions are running,
# each of them that has no location of its own for the key receives a clone
# of the old value first.
# Dies if no bucket list can be obtained.
sub delete_key {
    my $self = shift;
    my ($args) = @_;

    # XXX What should happen if this fails?
    my $blist = $self->get_bucket_list({
        key_md5 => $args->{key_md5},
    }) or die "How did delete_key fail (no blist)?!\n";

    # Save the location so that we can free the data
    my $location = $blist->get_data_location_for({
        allow_head => 0,
    });

    # Only load a sector when there is a location to load it from. Offset 0
    # is the file header, so loading "nothing" must never be attempted - the
    # result could end up being freed further down.
    my $old_value = $location
        ? $self->engine->_load_sector( $location )
        : undef;

    if ( $old_value && $self->engine->trans_id == 0 ) {
        my @transactions = $self->engine->read_transaction_slots;
        my @trans_ids = grep { $transactions[$_] } 0 .. $#transactions;
        foreach my $other_trans_id ( @trans_ids ) {
            next if $blist->get_data_location_for({ trans_id => $other_trans_id, allow_head => 0 });
            $blist->write_md5({
                trans_id => $other_trans_id,
                key      => $args->{key},
                key_md5  => $args->{key_md5},
                value    => $old_value->clone,
            });
        }
    }

    $blist->mark_deleted( $args );

    # Nothing was stored for this transaction, so there is nothing to hand
    # back or to free.
    return unless $old_value;

    my $data = $old_value->data;
    $old_value->free;

    return $data;
}
1067
# Returns the file location of this sector's index/bucket list, read from the
# bytes following the signature and the recycled counter (0 when there is
# none yet).
sub get_blist_loc {
    my ($self) = @_;

    my $engine = $self->engine;
    my $raw = $engine->storage->read_at( $self->offset + 2, $engine->byte_size );

    return unpack( $StP{$engine->byte_size}, $raw );
}
1075
# Returns the BucketList sector for this reference, set up for
# $args->{key_md5}.
#
# When the reference has no bucket list yet, one is created and linked in if
# $args->{create} is true; otherwise nothing is returned.
sub get_bucket_list {
    my ($self, $args) = @_;
    $args ||= {};

    # XXX Add in check here for recycling?

    my $engine = $self->engine;

    my $blist_loc = $self->get_blist_loc;

    if ( $blist_loc ) {
        return DBM::Deep::Engine::Sector::BucketList->new({
            engine  => $engine,
            offset  => $blist_loc,
            key_md5 => $args->{key_md5},
        });
    }

    # There's no index or blist yet
    return unless $args->{create};

    my $new_blist = DBM::Deep::Engine::Sector::BucketList->new({
        engine  => $engine,
        key_md5 => $args->{key_md5},
    });

    # Point this reference at the bucket list that was just created.
    $engine->storage->print_at( $self->offset + 2,
        pack( $StP{$engine->byte_size}, $new_blist->offset ),
    );

    return $new_blist;
}
1109
# Returns the class name linked from this sector, or nothing when no class
# name location is recorded.
sub get_classname {
    my ($self) = @_;

    my $engine = $self->engine;

    # The classname location follows the index/blist location.
    my $raw = $engine->storage->read_at(
        $self->offset + 2 + 1 * $engine->byte_size, $engine->byte_size,
    );
    my $class_offset = unpack( $StP{$engine->byte_size}, $raw );

    return unless $class_offset;

    return $engine->_load_sector( $class_offset )->data;
}
1122
# Build a DBM::Deep object rooted at this sector. When the storage has
# autobless enabled and a class name is recorded for the sector, the new
# object is reblessed into that class before being returned.
sub data {
    my $self = shift;

    my $engine  = $self->engine;
    my $storage = $engine->storage;

    my $obj = DBM::Deep->new({
        type        => $self->type,
        base_offset => $self->offset,
        storage     => $storage,
        engine      => $engine,
    });

    # Without autobless the plain DBM::Deep object is what callers get.
    return $obj unless $storage->{autobless};

    my $classname = $self->get_classname;
    bless $obj, $classname if defined $classname;

    return $obj;
}
1142
3976d8c9 1143package DBM::Deep::Engine::Sector::BucketList;
1144
1145our @ISA = qw( DBM::Deep::Engine::Sector );
1146
# Translate a transaction id into an index: the id plus one.
sub idx_for_txn {
    my ( $self, $trans_id ) = @_;
    return $trans_id + 1;
}
1148
# Initialise a bucket-list sector object.
#
# When the object has no offset yet, a sector of size() bytes is requested
# from the engine and written out as: the SIG_BLIST signature, a zeroed
# recycled counter, then zero bytes for the rest of the sector. If a key_md5
# was supplied, the bucket for it is looked up immediately.
#
# Returns $self.
sub _init {
    my $self = shift;

    my $engine = $self->engine;

    if ( !$self->offset ) {
        my $body_bytes = $self->size - $self->base_size;

        $self->{offset} = $engine->_request_sector( $self->size );
        $engine->storage->print_at(
            $self->offset,
            $engine->SIG_BLIST,        # Sector type
            pack( $StP{1}, 0 ),        # Recycled counter
            chr(0) x $body_bytes,      # Zero-fill the data
        );
    }

    $self->find_md5 if $self->{key_md5};

    return $self;
}
8fbac729 1171
# Length of the fixed sector header: signature plus recycled counter.
sub base_size {
    return 2;
}
1173
# Total size of a bucket-list sector in bytes:
#   base_size + max_buckets * bucket_size
# The value is computed on first use and cached in $self->{size}.
sub size {
    my $self = shift;

    $self->{size} ||= $self->base_size
        + $self->engine->max_buckets * $self->bucket_size;

    return $self->{size};
}
1182
# Size of one bucket in bytes: the key hash followed by (1 + num_txns)
# pointers of byte_size bytes each. Cached in $self->{bucket_size} after the
# first call.
sub bucket_size {
    my $self = shift;

    return $self->{bucket_size} if $self->{bucket_size};

    my $engine = $self->engine;

    # Key + transactions
    my $pointer_count = 1 + $engine->num_txns;
    $self->{bucket_size}
        = $engine->hash_size + $pointer_count * $engine->byte_size;

    return $self->{bucket_size};
}
8fbac729 1193
# Report whether the key_md5 is present in this bucket list. The search is
# run via find_md5() only if no result has been recorded yet; afterwards the
# stored $self->{found} is returned as-is.
sub has_md5 {
    my $self = shift;

    $self->find_md5 if !exists $self->{found};

    return $self->{found};
}
1201
# Scan the buckets in order for $self->{key_md5}.
#
# Results are left on the object:
#   found - 1 when a bucket holding the key_md5 was seen, otherwise undef
#   idx   - index of the matching bucket, or of the first blank bucket when
#           the scan hit one before any match, or -1 when every bucket was
#           examined without a match or a blank
#
# Throws via DBM::Deep->_throw_error when no key_md5 entry exists on the
# object. Always returns nothing.
sub find_md5 {
    my $self = shift;

    # Forget whatever an earlier search recorded.
    @{$self}{qw( found idx )} = ( undef, -1 );

    # If we don't have an MD5, then what are we supposed to do?
    DBM::Deep->_throw_error( "Cannot find_md5 without a key_md5 set" )
        unless exists $self->{key_md5};

    my $engine = $self->engine;

    BUCKET:
    for my $slot ( 0 .. $engine->max_buckets - 1 ) {
        my $stored_md5 = $engine->storage->read_at(
            $self->offset + $self->base_size + $slot * $self->bucket_size,
            $engine->hash_size,
        );

        # A blank bucket ends the scan; it takes precedence over a match.
        my $is_blank = $stored_md5 eq $engine->blank_md5;
        my $is_match = !$is_blank && $stored_md5 eq $self->{key_md5};

        next BUCKET unless $is_blank || $is_match;

        $self->{found} = 1 if $is_match;
        $self->{idx}   = $slot;
        return;
    }

    return;
}
1233
# Store a value pointer for a key in the bucket selected by find_md5().
#
# Arguments (hashref):
#   key      - the key itself; stored in a new Scalar sector when the bucket
#              does not hold this key yet
#   key_md5  - digest written at the start of the bucket
#   value    - sector object whose offset is recorded for the transaction
#   trans_id - optional; defaults to the engine's current transaction id
#              (the default is written back into the passed hashref)
#
# Throws via DBM::Deep->_throw_error when a required argument is missing or
# when the bucket list has no bucket available for the key.
sub write_md5 {
    my $self = shift;
    my ($args) = @_;

    DBM::Deep->_throw_error( "write_md5: no key" ) unless exists $args->{key};
    DBM::Deep->_throw_error( "write_md5: no key_md5" ) unless exists $args->{key_md5};
    DBM::Deep->_throw_error( "write_md5: no value" ) unless exists $args->{value};

    my $engine = $self->engine;

    $args->{trans_id} = $engine->trans_id unless exists $args->{trans_id};

    # find_md5() leaves idx at -1 when every bucket belongs to another key.
    # Using that index would place the write before the start of this
    # sector's bucket area, so refuse instead of corrupting the file.
    if ( defined $self->{idx} && $self->{idx} < 0 ) {
        DBM::Deep->_throw_error( "write_md5: no free bucket in this bucket list" );
    }

    my $spot = $self->offset + $self->base_size + $self->{idx} * $self->bucket_size;
    $engine->add_entry( $args->{trans_id}, $spot );

    # First write for this key: lay down the digest followed by the pointer
    # to a sector holding the key itself.
    unless ( $self->{found} ) {
        my $key_sector = DBM::Deep::Engine::Sector::Scalar->new({
            engine => $engine,
            data   => $args->{key},
        });

        $engine->storage->print_at( $spot,
            $args->{key_md5},
            pack( $StP{$engine->byte_size}, $key_sector->offset ),
        );
    }

    # Skip the digest and the key pointer, then index by transaction id.
    my $loc = $spot
            + $engine->hash_size
            + $engine->byte_size
            + $args->{trans_id} * $engine->byte_size;

    $engine->storage->print_at( $loc,
        pack( $StP{$engine->byte_size}, $args->{value}->offset ),
    );
}
1271
# Flag the current bucket as deleted for one transaction by writing the
# value 1 into that transaction's pointer slot.
#
# Arguments (optional hashref):
#   trans_id - defaults to the engine's current transaction id (the default
#              is written back into the passed hashref)
sub mark_deleted {
    my ( $self, $args ) = @_;
    $args ||= {};

    my $engine = $self->engine;

    if ( !exists $args->{trans_id} ) {
        $args->{trans_id} = $engine->trans_id;
    }

    my $bucket_start
        = $self->offset + $self->base_size + $self->{idx} * $self->bucket_size;
    $engine->add_entry( $args->{trans_id}, $bucket_start );

    # Skip the digest and the key pointer, then index by transaction id.
    my $slot = $bucket_start
             + $engine->hash_size
             + $engine->byte_size
             + $args->{trans_id} * $engine->byte_size;

    # 1 is the marker for deleted
    $engine->storage->print_at( $slot, pack( $StP{$engine->byte_size}, 1 ) );
}
1293
# Physically remove the current bucket from the bucket list and free the
# sectors it referenced.
#
# The buckets that follow the removed one are moved down by one position and
# the last bucket of the sector is zeroed. Returns the data of the removed
# value sector, or undef when the key is not present or no value sector
# could be loaded.
sub delete_md5 {
    my $self = shift;

    my $engine = $self->engine;
    return undef unless $self->{found};

    # Save the location so that we can free the data
    my $location = $self->get_data_location_for({
        allow_head => 0,
    });
    my $key_sector = $self->get_key_for;

    #XXX This isn't going to work right and you know it! This eradicates data
    # that we're not ready to eradicate just yet.
    my $bucket_size = $self->bucket_size;
    my $spot = $self->offset + $self->base_size + $self->{idx} * $bucket_size;

    # Number of buckets stored after the one being removed. A sector holds
    # max_buckets buckets; num_txns only describes the pointer slots inside a
    # single bucket, so it must not be used to size this move.
    my $trailing = $engine->max_buckets - $self->{idx} - 1;
    my $shifted  = $trailing > 0
        ? $engine->storage->read_at( $spot + $bucket_size, $bucket_size * $trailing )
        : '';

    $engine->storage->print_at( $spot,
        $shifted,
        chr(0) x $bucket_size,
    );

    # get_key_for() returns nothing when no key sector is recorded.
    $key_sector->free if $key_sector;

    my $data_sector = $engine->_load_sector( $location );
    return undef unless $data_sector;

    my $data = $data_sector->data;
    $data_sector->free;

    return $data;
}
1326
# Look up the stored value location for a bucket and transaction.
#
# Arguments (optional hashref; defaults are written back into it):
#   trans_id   - transaction to look at; defaults to the engine's current one
#   idx        - bucket index; defaults to $self->{idx}
#   allow_head - when true and the transaction's slot is empty, retry with
#                transaction 0 (the HEAD); defaults to 0
#
# Returns the location, or 0 when the slot is empty or holds 1 (the value
# mark_deleted() writes as the deleted marker).
sub get_data_location_for {
    my $self = shift;
    my ($args) = @_;
    $args ||= {};

    $args->{allow_head} = 0 unless exists $args->{allow_head};
    $args->{trans_id} = $self->engine->trans_id unless exists $args->{trans_id};
    $args->{idx} = $self->{idx} unless exists $args->{idx};

    my $engine = $self->engine;

    # Skip the digest and the key pointer, then index by transaction id.
    my $location = $engine->storage->read_at(
        $self->offset + $self->base_size
            + $args->{idx} * $self->bucket_size
            + $engine->hash_size
            + $engine->byte_size
            + $args->{trans_id} * $engine->byte_size,
        $engine->byte_size,
    );
    my $loc = unpack( $StP{$engine->byte_size}, $location );

    # If we're in a transaction and we never wrote to this location, try the
    # HEAD instead. The bucket index must be carried along, otherwise the
    # retry would fall back to $self->{idx} and read a different bucket than
    # the one the caller asked for.
    if ( $args->{trans_id} && !$loc && $args->{allow_head} ) {
        return $self->get_data_location_for({
            trans_id   => 0,
            allow_head => 1,
            idx        => $args->{idx},
        });
    }

    return $loc <= 1 ? 0 : $loc;
}
1356
# Load the value sector for the current bucket.
#
# Arguments (optional hashref):
#   allow_head - forwarded unchanged to get_data_location_for()
#
# Returns nothing when the key was not found; otherwise whatever the
# engine's _load_sector() returns for the looked-up location.
sub get_data_for {
    my ( $self, $args ) = @_;
    $args ||= {};

    return unless $self->{found};

    my %lookup   = ( allow_head => $args->{allow_head} );
    my $location = $self->get_data_location_for( \%lookup );

    return $self->engine->_load_sector( $location );
}
1368
# Load the sector holding the key of a bucket.
#
# Arguments:
#   $idx - optional bucket index; defaults to $self->{idx}
#
# The key pointer sits directly after the digest inside the bucket. Returns
# nothing when that pointer is zero, otherwise the result of the engine's
# _load_sector() for it.
sub get_key_for {
    my ( $self, $idx ) = @_;
    $idx = $self->{idx} unless defined $idx;

    my $engine = $self->engine;

    my $packed = $engine->storage->read_at(
        $self->offset + $self->base_size + $idx * $self->bucket_size + $engine->hash_size,
        $engine->byte_size,
    );
    my $key_loc = unpack( $StP{$engine->byte_size}, $packed );

    return unless $key_loc;

    return $engine->_load_sector( $key_loc );
}
696cadb7 1382
13831;
1384__END__