Removed unneeded Fcntl imports in DBM::Deep
[dbsrgits/DBM-Deep.git] / lib / DBM / Deep.pm
CommitLineData
ffed8b01 1package DBM::Deep;
2
3##
4# DBM::Deep
5#
6# Description:
d0b74c17 7# Multi-level database module for storing hash trees, arrays and simple
8# key/value pairs into FTP-able, cross-platform binary database files.
ffed8b01 9#
d0b74c17 10# Type `perldoc DBM::Deep` for complete documentation.
ffed8b01 11#
12# Usage Examples:
d0b74c17 13# my %db;
14# tie %db, 'DBM::Deep', 'my_database.db'; # standard tie() method
ffed8b01 15#
d0b74c17 16# my $db = new DBM::Deep( 'my_database.db' ); # preferred OO method
17#
18# $db->{my_scalar} = 'hello world';
19# $db->{my_hash} = { larry => 'genius', hashes => 'fast' };
20# $db->{my_array} = [ 1, 2, 3, time() ];
21# $db->{my_complex} = [ 'hello', { perl => 'rules' }, 42, 99 ];
22# push @{$db->{my_array}}, 'another value';
23# my @key_list = keys %{$db->{my_hash}};
24# print "This module " . $db->{my_complex}->[1]->{perl} . "!\n";
ffed8b01 25#
26# Copyright:
d0b74c17 27# (c) 2002-2006 Joseph Huckaby. All Rights Reserved.
28# This program is free software; you can redistribute it and/or
29# modify it under the same terms as Perl itself.
ffed8b01 30##
31
460b1067 32use 5.6.0;
33
ffed8b01 34use strict;
460b1067 35use warnings;
8b957036 36
d8db2929 37our $VERSION = q(0.99_03);
86867f3a 38
05be6af2 39use Fcntl qw( :flock );
12b96196 40
41use Clone::Any '_clone_data';
ffed8b01 42use Digest::MD5 ();
a8fdabda 43use FileHandle::Fmode ();
ffed8b01 44use Scalar::Util ();
ffed8b01 45
696cadb7 46use DBM::Deep::Engine3;
460b1067 47use DBM::Deep::File;
95967a5e 48
ffed8b01 49##
50# Setup constants for users to pass to new()
51##
696cadb7 52sub TYPE_HASH () { DBM::Deep::Engine3->SIG_HASH }
53sub TYPE_ARRAY () { DBM::Deep::Engine3->SIG_ARRAY }
ffed8b01 54
696cadb7 55# This is used in all the children of this class in their TIE<type> methods.
0ca7ea98 56sub _get_args {
57 my $proto = shift;
58
59 my $args;
60 if (scalar(@_) > 1) {
61 if ( @_ % 2 ) {
62 $proto->_throw_error( "Odd number of parameters to " . (caller(1))[2] );
63 }
64 $args = {@_};
65 }
d0b74c17 66 elsif ( ref $_[0] ) {
4d35d856 67 unless ( eval { local $SIG{'__DIE__'}; %{$_[0]} || 1 } ) {
0ca7ea98 68 $proto->_throw_error( "Not a hashref in args to " . (caller(1))[2] );
69 }
70 $args = $_[0];
71 }
d0b74c17 72 else {
0ca7ea98 73 $args = { file => shift };
74 }
75
76 return $args;
77}
78
ffed8b01 79sub new {
d0b74c17 80 ##
81 # Class constructor method for Perl OO interface.
82 # Calls tie() and returns blessed reference to tied hash or array,
83 # providing a hybrid OO/tie interface.
84 ##
85 my $class = shift;
86 my $args = $class->_get_args( @_ );
87
88 ##
89 # Check if we want a tied hash or array.
90 ##
91 my $self;
92 if (defined($args->{type}) && $args->{type} eq TYPE_ARRAY) {
6fe26b29 93 $class = 'DBM::Deep::Array';
94 require DBM::Deep::Array;
d0b74c17 95 tie @$self, $class, %$args;
96 }
97 else {
6fe26b29 98 $class = 'DBM::Deep::Hash';
99 require DBM::Deep::Hash;
d0b74c17 100 tie %$self, $class, %$args;
101 }
ffed8b01 102
d0b74c17 103 return bless $self, $class;
ffed8b01 104}
105
96041a25 106# This initializer is called from the various TIE* methods. new() calls tie(),
107# which allows for a single point of entry.
0795f290 108sub _init {
0795f290 109 my $class = shift;
994ccd8e 110 my ($args) = @_;
0795f290 111
83371fe3 112 $args->{storage} = DBM::Deep::File->new( $args )
113 unless exists $args->{storage};
460b1067 114
115 # locking implicitly enables autoflush
116 if ($args->{locking}) { $args->{autoflush} = 1; }
117
0795f290 118 # These are the defaults to be optionally overridden below
119 my $self = bless {
95967a5e 120 type => TYPE_HASH,
e06824f8 121 base_offset => undef,
359a01ac 122
83371fe3 123 storage => undef,
c9f02899 124 engine => undef,
0795f290 125 }, $class;
c9f02899 126
127 $args->{engine} = DBM::Deep::Engine3->new( { %{$args}, obj => $self } )
128 unless exists $args->{engine};
8db25060 129
fde3db1a 130 # Grab the parameters we want to use
0795f290 131 foreach my $param ( keys %$self ) {
132 next unless exists $args->{$param};
3e9498a1 133 $self->{$param} = $args->{$param};
ffed8b01 134 }
d0b74c17 135
696cadb7 136 eval {
137 local $SIG{'__DIE__'};
3ed26433 138
696cadb7 139 $self->lock;
140 $self->_engine->setup_fh( $self );
3ed26433 141 $self->_storage->set_inode;
696cadb7 142 $self->unlock;
143 }; if ( $@ ) {
144 my $e = $@;
145 eval { local $SIG{'__DIE__'}; $self->unlock; };
146 die $e;
147 }
359a01ac 148
0795f290 149 return $self;
ffed8b01 150}
151
ffed8b01 152sub TIEHASH {
6fe26b29 153 shift;
154 require DBM::Deep::Hash;
155 return DBM::Deep::Hash->TIEHASH( @_ );
ffed8b01 156}
157
158sub TIEARRAY {
6fe26b29 159 shift;
160 require DBM::Deep::Array;
161 return DBM::Deep::Array->TIEARRAY( @_ );
ffed8b01 162}
163
ffed8b01 164sub lock {
994ccd8e 165 my $self = shift->_get_self;
83371fe3 166 return $self->_storage->lock( $self, @_ );
ffed8b01 167}
168
169sub unlock {
994ccd8e 170 my $self = shift->_get_self;
83371fe3 171 return $self->_storage->unlock( $self, @_ );
ffed8b01 172}
173
906c8e01 174sub _copy_value {
175 my $self = shift->_get_self;
176 my ($spot, $value) = @_;
177
178 if ( !ref $value ) {
179 ${$spot} = $value;
180 }
181 elsif ( eval { local $SIG{__DIE__}; $value->isa( 'DBM::Deep' ) } ) {
f9c33187 182 ${$spot} = $value->_repr;
906c8e01 183 $value->_copy_node( ${$spot} );
184 }
185 else {
186 my $r = Scalar::Util::reftype( $value );
187 my $c = Scalar::Util::blessed( $value );
188 if ( $r eq 'ARRAY' ) {
189 ${$spot} = [ @{$value} ];
190 }
191 else {
192 ${$spot} = { %{$value} };
193 }
95bbd935 194 ${$spot} = bless ${$spot}, $c
906c8e01 195 if defined $c;
196 }
197
198 return 1;
199}
200
261d1296 201sub _copy_node {
f9c33187 202 die "Must be implemented in a child class\n";
203}
906c8e01 204
f9c33187 205sub _repr {
206 die "Must be implemented in a child class\n";
ffed8b01 207}
208
209sub export {
d0b74c17 210 ##
211 # Recursively export into standard Perl hashes and arrays.
212 ##
994ccd8e 213 my $self = shift->_get_self;
d0b74c17 214
f9c33187 215 my $temp = $self->_repr;
d0b74c17 216
217 $self->lock();
218 $self->_copy_node( $temp );
219 $self->unlock();
220
c9f02899 221 my $classname = $self->_engine->get_classname( $self );
84467b9f 222 if ( defined $classname ) {
223 bless $temp, $classname;
68f943b3 224 }
225
d0b74c17 226 return $temp;
ffed8b01 227}
228
229sub import {
d0b74c17 230 ##
231 # Recursively import Perl hash/array structure
232 ##
d0b74c17 233 if (!ref($_[0])) { return; } # Perl calls import() on use -- ignore
234
994ccd8e 235 my $self = shift->_get_self;
236 my ($struct) = @_;
d0b74c17 237
c9cec40e 238 # struct is not a reference, so just import based on our type
d0b74c17 239 if (!ref($struct)) {
f9c33187 240 $struct = $self->_repr( @_ );
d0b74c17 241 }
242
12b96196 243 #XXX This isn't the best solution. Better would be to use Data::Walker,
244 #XXX but that's a lot more thinking than I want to do right now.
7a960a12 245 eval {
84467b9f 246 #$self->begin_work;
12b96196 247 $self->_import( _clone_data( $struct ) );
84467b9f 248 #$self->commit;
7a960a12 249 }; if ( $@ ) {
84467b9f 250 #$self->rollback;
7a960a12 251 die $@;
252 }
253
254 return 1;
ffed8b01 255}
256
13ff93d5 257#XXX Need to keep track of who has a fh to this file in order to
258#XXX close them all prior to optimize on Win32/cygwin
ffed8b01 259sub optimize {
d0b74c17 260 ##
261 # Rebuild entire database into new file, then move
262 # it back on top of original.
263 ##
994ccd8e 264 my $self = shift->_get_self;
cc4bef86 265
266#XXX Need to create a new test for this
83371fe3 267# if ($self->_storage->{links} > 1) {
1400a48e 268# $self->_throw_error("Cannot optimize: reference count is greater than 1");
d0b74c17 269# }
270
7a960a12 271 #XXX Do we have to lock the tempfile?
272
d0b74c17 273 my $db_temp = DBM::Deep->new(
83371fe3 274 file => $self->_storage->{file} . '.tmp',
d0b74c17 275 type => $self->_type
276 );
d0b74c17 277
278 $self->lock();
279 $self->_copy_node( $db_temp );
280 undef $db_temp;
281
282 ##
283 # Attempt to copy user, group and permissions over to new file
284 ##
285 my @stats = stat($self->_fh);
286 my $perms = $stats[2] & 07777;
287 my $uid = $stats[4];
288 my $gid = $stats[5];
83371fe3 289 chown( $uid, $gid, $self->_storage->{file} . '.tmp' );
290 chmod( $perms, $self->_storage->{file} . '.tmp' );
d0b74c17 291
ffed8b01 292 # q.v. perlport for more information on this variable
90f93b43 293 if ( $^O eq 'MSWin32' || $^O eq 'cygwin' ) {
d0b74c17 294 ##
295 # Potential race condition when optmizing on Win32 with locking.
296 # The Windows filesystem requires that the filehandle be closed
297 # before it is overwritten with rename(). This could be redone
298 # with a soft copy.
299 ##
300 $self->unlock();
83371fe3 301 $self->_storage->close;
d0b74c17 302 }
303
83371fe3 304 if (!rename $self->_storage->{file} . '.tmp', $self->_storage->{file}) {
305 unlink $self->_storage->{file} . '.tmp';
d0b74c17 306 $self->unlock();
1400a48e 307 $self->_throw_error("Optimize failed: Cannot copy temp file over original: $!");
d0b74c17 308 }
309
310 $self->unlock();
83371fe3 311 $self->_storage->close;
312 $self->_storage->open;
72e315ac 313 $self->_engine->setup_fh( $self );
70b55428 314
d0b74c17 315 return 1;
ffed8b01 316}
317
318sub clone {
d0b74c17 319 ##
320 # Make copy of object and return
321 ##
994ccd8e 322 my $self = shift->_get_self;
d0b74c17 323
324 return DBM::Deep->new(
c3aafc14 325 type => $self->_type,
d0b74c17 326 base_offset => $self->_base_offset,
83371fe3 327 storage => $self->_storage,
c9f02899 328 engine => $self->_engine,
d0b74c17 329 );
ffed8b01 330}
331
332{
333 my %is_legal_filter = map {
334 $_ => ~~1,
335 } qw(
336 store_key store_value
337 fetch_key fetch_value
338 );
339
340 sub set_filter {
341 ##
342 # Setup filter function for storing or fetching the key or value
343 ##
994ccd8e 344 my $self = shift->_get_self;
345 my $type = lc shift;
346 my $func = shift;
d0b74c17 347
ffed8b01 348 if ( $is_legal_filter{$type} ) {
83371fe3 349 $self->_storage->{"filter_$type"} = $func;
ffed8b01 350 return 1;
351 }
352
353 return;
354 }
355}
356
fee0243f 357sub begin_work {
358 my $self = shift->_get_self;
8cb9205a 359 return $self->_engine->begin_work( $self, @_ );
fee0243f 360}
361
362sub rollback {
363 my $self = shift->_get_self;
8cb9205a 364 return $self->_engine->rollback( $self, @_ );
fee0243f 365}
366
359a01ac 367sub commit {
368 my $self = shift->_get_self;
8cb9205a 369 return $self->_engine->commit( $self, @_ );
359a01ac 370}
fee0243f 371
ffed8b01 372##
373# Accessor methods
374##
375
72e315ac 376sub _engine {
377 my $self = $_[0]->_get_self;
378 return $self->{engine};
379}
380
83371fe3 381sub _storage {
2ac02042 382 my $self = $_[0]->_get_self;
83371fe3 383 return $self->{storage};
ffed8b01 384}
385
4d35d856 386sub _type {
2ac02042 387 my $self = $_[0]->_get_self;
d0b74c17 388 return $self->{type};
ffed8b01 389}
390
4d35d856 391sub _base_offset {
2ac02042 392 my $self = $_[0]->_get_self;
d0b74c17 393 return $self->{base_offset};
ffed8b01 394}
395
994ccd8e 396sub _fh {
994ccd8e 397 my $self = $_[0]->_get_self;
83371fe3 398 return $self->_storage->{fh};
994ccd8e 399}
400
ffed8b01 401##
402# Utility methods
403##
404
261d1296 405sub _throw_error {
95967a5e 406 die "DBM::Deep: $_[1]\n";
ffed8b01 407}
408
ffed8b01 409sub STORE {
d0b74c17 410 ##
411 # Store single hash key/value or array element in database.
412 ##
413 my $self = shift->_get_self;
359a01ac 414 my ($key, $value, $orig_key) = @_;
c3aafc14 415 $orig_key = $key unless defined $orig_key;
81d3d316 416
a8fdabda 417 if ( !FileHandle::Fmode::is_W( $self->_fh ) ) {
acd4faf2 418 $self->_throw_error( 'Cannot write to a readonly filehandle' );
419 }
d0b74c17 420
421 ##
422 # Request exclusive lock for writing
423 ##
424 $self->lock( LOCK_EX );
425
0cb639bd 426 # User may be storing a complex value, in which case we do not want it run
427 # through the filtering system.
83371fe3 428 if ( !ref($value) && $self->_storage->{filter_store_value} ) {
429 $value = $self->_storage->{filter_store_value}->( $value );
d0b74c17 430 }
431
c9f02899 432 $self->_engine->write_value( $self, $key, $value, $orig_key );
d0b74c17 433
434 $self->unlock();
435
86867f3a 436 return 1;
ffed8b01 437}
438
439sub FETCH {
d0b74c17 440 ##
441 # Fetch single value or element given plain key or array index
442 ##
cb79ec85 443 my $self = shift->_get_self;
a97c8f67 444 my ($key, $orig_key) = @_;
0cb639bd 445 $orig_key = $key unless defined $orig_key;
ffed8b01 446
d0b74c17 447 ##
448 # Request shared lock for reading
449 ##
450 $self->lock( LOCK_SH );
451
c9f02899 452 my $result = $self->_engine->read_value( $self, $key, $orig_key );
d0b74c17 453
454 $self->unlock();
455
a86430bd 456 # Filters only apply to scalar values, so the ref check is making
457 # sure the fetched bucket is a scalar, not a child hash or array.
83371fe3 458 return ($result && !ref($result) && $self->_storage->{filter_fetch_value})
459 ? $self->_storage->{filter_fetch_value}->($result)
cb79ec85 460 : $result;
ffed8b01 461}
462
463sub DELETE {
d0b74c17 464 ##
465 # Delete single key/value pair or element given plain key or array index
466 ##
a97c8f67 467 my $self = shift->_get_self;
468 my ($key, $orig_key) = @_;
c3aafc14 469 $orig_key = $key unless defined $orig_key;
d0b74c17 470
a8fdabda 471 if ( !FileHandle::Fmode::is_W( $self->_fh ) ) {
a86430bd 472 $self->_throw_error( 'Cannot write to a readonly filehandle' );
473 }
d0b74c17 474
475 ##
476 # Request exclusive lock for writing
477 ##
478 $self->lock( LOCK_EX );
479
d0b74c17 480 ##
481 # Delete bucket
482 ##
c9f02899 483 my $value = $self->_engine->delete_key( $self, $key, $orig_key );
a86430bd 484
83371fe3 485 if (defined $value && !ref($value) && $self->_storage->{filter_fetch_value}) {
486 $value = $self->_storage->{filter_fetch_value}->($value);
3b6a5056 487 }
488
d0b74c17 489 $self->unlock();
490
491 return $value;
ffed8b01 492}
493
494sub EXISTS {
d0b74c17 495 ##
496 # Check if a single key or element exists given plain key or array index
497 ##
a97c8f67 498 my $self = shift->_get_self;
499 my ($key) = @_;
d0b74c17 500
d0b74c17 501 ##
502 # Request shared lock for reading
503 ##
504 $self->lock( LOCK_SH );
505
c9f02899 506 my $result = $self->_engine->key_exists( $self, $key );
d0b74c17 507
508 $self->unlock();
509
510 return $result;
ffed8b01 511}
512
513sub CLEAR {
d0b74c17 514 ##
515 # Clear all keys from hash, or all elements from array.
516 ##
a97c8f67 517 my $self = shift->_get_self;
ffed8b01 518
a8fdabda 519 if ( !FileHandle::Fmode::is_W( $self->_fh ) ) {
a86430bd 520 $self->_throw_error( 'Cannot write to a readonly filehandle' );
521 }
522
d0b74c17 523 ##
524 # Request exclusive lock for writing
525 ##
526 $self->lock( LOCK_EX );
527
f9a320bb 528 if ( $self->_type eq TYPE_HASH ) {
529 my $key = $self->first_key;
530 while ( $key ) {
83c43bb5 531 # Retrieve the key before deleting because we depend on next_key
f9a320bb 532 my $next_key = $self->next_key( $key );
c9f02899 533 $self->_engine->delete_key( $self, $key, $key );
f9a320bb 534 $key = $next_key;
535 }
536 }
537 else {
538 my $size = $self->FETCHSIZE;
c3aafc14 539 for my $key ( 0 .. $size - 1 ) {
c9f02899 540 $self->_engine->delete_key( $self, $key, $key );
f9a320bb 541 }
542 $self->STORESIZE( 0 );
543 }
f9c33187 544#XXX This needs updating to use _release_space
f9a320bb 545# $self->_engine->write_tag(
546# $self->_base_offset, $self->_type,
547# chr(0)x$self->_engine->{index_size},
548# );
d0b74c17 549
550 $self->unlock();
551
552 return 1;
ffed8b01 553}
554
ffed8b01 555##
556# Public method aliases
557##
7f441181 558sub put { (shift)->STORE( @_ ) }
559sub store { (shift)->STORE( @_ ) }
560sub get { (shift)->FETCH( @_ ) }
561sub fetch { (shift)->FETCH( @_ ) }
baa27ab6 562sub delete { (shift)->DELETE( @_ ) }
563sub exists { (shift)->EXISTS( @_ ) }
564sub clear { (shift)->CLEAR( @_ ) }
ffed8b01 565
5661;
ffed8b01 567__END__
568
569=head1 NAME
570
571DBM::Deep - A pure perl multi-level hash/array DBM
572
573=head1 SYNOPSIS
574
575 use DBM::Deep;
576 my $db = DBM::Deep->new( "foo.db" );
d0b74c17 577
eff6a245 578 $db->{key} = 'value';
ffed8b01 579 print $db->{key};
d0b74c17 580
eff6a245 581 $db->put('key' => 'value');
ffed8b01 582 print $db->get('key');
d0b74c17 583
ffed8b01 584 # true multi-level support
585 $db->{my_complex} = [
d0b74c17 586 'hello', { perl => 'rules' },
587 42, 99,
90f93b43 588 ];
ffed8b01 589
eff6a245 590 tie my %db, 'DBM::Deep', 'foo.db';
591 $db{key} = 'value';
592 print $db{key};
ffed8b01 593
eff6a245 594 tied(%db)->put('key' => 'value');
595 print tied(%db)->get('key');
8db25060 596
eff6a245 597=head1 DESCRIPTION
8db25060 598
eff6a245 599A unique flat-file database module, written in pure perl. True multi-level
600hash/array support (unlike MLDBM, which is faked), hybrid OO / tie()
601interface, cross-platform FTPable files, ACID transactions, and is quite fast.
602Can handle millions of keys and unlimited levels without significant
603slow-down. Written from the ground-up in pure perl -- this is NOT a wrapper
604around a C-based DBM. Out-of-the-box compatibility with Unix, Mac OS X and
605Windows.
ffed8b01 606
eff6a245 607=head1 VERSION DIFFERENCES
ffed8b01 608
eff6a245 609B<NOTE>: 0.99_01 and above have significant file format differences from 0.983 and
610before. There will be a backwards-compatibility layer in 1.00, but that is
611slated for a later 0.99_x release. This version is B<NOT> backwards compatible
612with 0.983 and before.
ffed8b01 613
614=head1 SETUP
615
d0b74c17 616Construction can be done OO-style (which is the recommended way), or using
ffed8b01 617Perl's tie() function. Both are examined here.
618
619=head2 OO CONSTRUCTION
620
621The recommended way to construct a DBM::Deep object is to use the new()
eff6a245 622method, which gets you a blessed I<and> tied hash (or array) reference.
ffed8b01 623
a8fdabda 624 my $db = DBM::Deep->new( "foo.db" );
ffed8b01 625
626This opens a new database handle, mapped to the file "foo.db". If this
d0b74c17 627file does not exist, it will automatically be created. DB files are
ffed8b01 628opened in "r+" (read/write) mode, and the type of object returned is a
629hash, unless otherwise specified (see L<OPTIONS> below).
630
ffed8b01 631You can pass a number of options to the constructor to specify things like
eff6a245 632locking, autoflush, etc. This is done by passing an inline hash (or hashref):
ffed8b01 633
a8fdabda 634 my $db = DBM::Deep->new(
635 file => "foo.db",
636 locking => 1,
637 autoflush => 1
638 );
ffed8b01 639
640Notice that the filename is now specified I<inside> the hash with
d0b74c17 641the "file" parameter, as opposed to being the sole argument to the
ffed8b01 642constructor. This is required if any options are specified.
643See L<OPTIONS> below for the complete list.
644
ffed8b01 645You can also start with an array instead of a hash. For this, you must
646specify the C<type> parameter:
647
a8fdabda 648 my $db = DBM::Deep->new(
649 file => "foo.db",
650 type => DBM::Deep->TYPE_ARRAY
651 );
ffed8b01 652
653B<Note:> Specifing the C<type> parameter only takes effect when beginning
654a new DB file. If you create a DBM::Deep object with an existing file, the
90f93b43 655C<type> will be loaded from the file header, and an error will be thrown if
656the wrong type is passed in.
ffed8b01 657
658=head2 TIE CONSTRUCTION
659
90f93b43 660Alternately, you can create a DBM::Deep handle by using Perl's built-in
661tie() function. The object returned from tie() can be used to call methods,
eff6a245 662such as lock() and unlock(). (That object can be retrieved from the tied
663variable at any time using tied() - please see L<perltie/> for more info.
ffed8b01 664
a8fdabda 665 my %hash;
666 my $db = tie %hash, "DBM::Deep", "foo.db";
d0b74c17 667
a8fdabda 668 my @array;
669 my $db = tie @array, "DBM::Deep", "bar.db";
ffed8b01 670
671As with the OO constructor, you can replace the DB filename parameter with
672a hash containing one or more options (see L<OPTIONS> just below for the
673complete list).
674
a8fdabda 675 tie %hash, "DBM::Deep", {
676 file => "foo.db",
677 locking => 1,
678 autoflush => 1
679 };
ffed8b01 680
681=head2 OPTIONS
682
683There are a number of options that can be passed in when constructing your
684DBM::Deep objects. These apply to both the OO- and tie- based approaches.
685
686=over
687
688=item * file
689
690Filename of the DB file to link the handle to. You can pass a full absolute
d0b74c17 691filesystem path, partial path, or a plain filename if the file is in the
714618f0 692current working directory. This is a required parameter (though q.v. fh).
693
694=item * fh
695
696If you want, you can pass in the fh instead of the file. This is most useful for doing
697something like:
698
699 my $db = DBM::Deep->new( { fh => \*DATA } );
700
701You are responsible for making sure that the fh has been opened appropriately for your
702needs. If you open it read-only and attempt to write, an exception will be thrown. If you
703open it write-only or append-only, an exception will be thrown immediately as DBM::Deep
704needs to read from the fh.
705
706=item * file_offset
707
708This is the offset within the file that the DBM::Deep db starts. Most of the time, you will
709not need to set this. However, it's there if you want it.
710
711If you pass in fh and do not set this, it will be set appropriately.
ffed8b01 712
ffed8b01 713=item * type
714
715This parameter specifies what type of object to create, a hash or array. Use
359a01ac 716one of these two constants:
717
718=over 4
719
720=item * C<DBM::Deep-E<gt>TYPE_HASH>
721
722=item * C<DBM::Deep-E<gt>TYPE_ARRAY>.
723
724=back
725
d0b74c17 726This only takes effect when beginning a new file. This is an optional
ffed8b01 727parameter, and defaults to C<DBM::Deep-E<gt>TYPE_HASH>.
728
729=item * locking
730
eff6a245 731Specifies whether locking is to be enabled. DBM::Deep uses Perl's flock()
732function to lock the database in exclusive mode for writes, and shared mode
733for reads. Pass any true value to enable. This affects the base DB handle
734I<and any child hashes or arrays> that use the same DB file. This is an
735optional parameter, and defaults to 0 (disabled). See L<LOCKING> below for
736more.
ffed8b01 737
738=item * autoflush
739
d0b74c17 740Specifies whether autoflush is to be enabled on the underlying filehandle.
741This obviously slows down write operations, but is required if you may have
742multiple processes accessing the same DB file (also consider enable I<locking>).
743Pass any true value to enable. This is an optional parameter, and defaults to 0
ffed8b01 744(disabled).
745
746=item * autobless
747
359a01ac 748If I<autobless> mode is enabled, DBM::Deep will preserve the class something
749is blessed into, and restores it when fetched. This is an optional parameter, and defaults to 1 (enabled).
750
751B<Note:> If you use the OO-interface, you will not be able to call any methods
752of DBM::Deep on the blessed item. This is considered to be a feature.
ffed8b01 753
754=item * filter_*
755
359a01ac 756See L</FILTERS> below.
ffed8b01 757
ffed8b01 758=back
759
760=head1 TIE INTERFACE
761
762With DBM::Deep you can access your databases using Perl's standard hash/array
90f93b43 763syntax. Because all DBM::Deep objects are I<tied> to hashes or arrays, you can
764treat them as such. DBM::Deep will intercept all reads/writes and direct them
765to the right place -- the DB file. This has nothing to do with the
766L<TIE CONSTRUCTION> section above. This simply tells you how to use DBM::Deep
767using regular hashes and arrays, rather than calling functions like C<get()>
768and C<put()> (although those work too). It is entirely up to you how to want
769to access your databases.
ffed8b01 770
771=head2 HASHES
772
773You can treat any DBM::Deep object like a normal Perl hash reference. Add keys,
774or even nested hashes (or arrays) using standard Perl syntax:
775
a8fdabda 776 my $db = DBM::Deep->new( "foo.db" );
d0b74c17 777
a8fdabda 778 $db->{mykey} = "myvalue";
779 $db->{myhash} = {};
780 $db->{myhash}->{subkey} = "subvalue";
ffed8b01 781
a8fdabda 782 print $db->{myhash}->{subkey} . "\n";
ffed8b01 783
784You can even step through hash keys using the normal Perl C<keys()> function:
785
a8fdabda 786 foreach my $key (keys %$db) {
787 print "$key: " . $db->{$key} . "\n";
788 }
ffed8b01 789
790Remember that Perl's C<keys()> function extracts I<every> key from the hash and
d0b74c17 791pushes them onto an array, all before the loop even begins. If you have an
eff6a245 792extremely large hash, this may exhaust Perl's memory. Instead, consider using
d0b74c17 793Perl's C<each()> function, which pulls keys/values one at a time, using very
ffed8b01 794little memory:
795
a8fdabda 796 while (my ($key, $value) = each %$db) {
797 print "$key: $value\n";
798 }
ffed8b01 799
800Please note that when using C<each()>, you should always pass a direct
801hash reference, not a lookup. Meaning, you should B<never> do this:
802
a8fdabda 803 # NEVER DO THIS
804 while (my ($key, $value) = each %{$db->{foo}}) { # BAD
ffed8b01 805
806This causes an infinite loop, because for each iteration, Perl is calling
807FETCH() on the $db handle, resulting in a "new" hash for foo every time, so
d0b74c17 808it effectively keeps returning the first key over and over again. Instead,
ffed8b01 809assign a temporary variable to C<$db->{foo}>, then pass that to each().
810
811=head2 ARRAYS
812
813As with hashes, you can treat any DBM::Deep object like a normal Perl array
d0b74c17 814reference. This includes inserting, removing and manipulating elements,
ffed8b01 815and the C<push()>, C<pop()>, C<shift()>, C<unshift()> and C<splice()> functions.
d0b74c17 816The object must have first been created using type C<DBM::Deep-E<gt>TYPE_ARRAY>,
ffed8b01 817or simply be a nested array reference inside a hash. Example:
818
a8fdabda 819 my $db = DBM::Deep->new(
820 file => "foo-array.db",
821 type => DBM::Deep->TYPE_ARRAY
822 );
d0b74c17 823
a8fdabda 824 $db->[0] = "foo";
825 push @$db, "bar", "baz";
826 unshift @$db, "bah";
d0b74c17 827
a8fdabda 828 my $last_elem = pop @$db; # baz
829 my $first_elem = shift @$db; # bah
830 my $second_elem = $db->[1]; # bar
d0b74c17 831
a8fdabda 832 my $num_elements = scalar @$db;
ffed8b01 833
834=head1 OO INTERFACE
835
836In addition to the I<tie()> interface, you can also use a standard OO interface
837to manipulate all aspects of DBM::Deep databases. Each type of object (hash or
d0b74c17 838array) has its own methods, but both types share the following common methods:
eff6a245 839C<put()>, C<get()>, C<exists()>, C<delete()> and C<clear()>. C<fetch()> and
840C<store(> are aliases to C<put()> and C<get()>, respectively.
ffed8b01 841
842=over
843
4d35d856 844=item * new() / clone()
845
846These are the constructor and copy-functions.
847
90f93b43 848=item * put() / store()
ffed8b01 849
850Stores a new hash key/value pair, or sets an array element value. Takes two
851arguments, the hash key or array index, and the new value. The value can be
852a scalar, hash ref or array ref. Returns true on success, false on failure.
853
a8fdabda 854 $db->put("foo", "bar"); # for hashes
855 $db->put(1, "bar"); # for arrays
ffed8b01 856
90f93b43 857=item * get() / fetch()
ffed8b01 858
859Fetches the value of a hash key or array element. Takes one argument: the hash
d0b74c17 860key or array index. Returns a scalar, hash ref or array ref, depending on the
ffed8b01 861data type stored.
862
a8fdabda 863 my $value = $db->get("foo"); # for hashes
864 my $value = $db->get(1); # for arrays
ffed8b01 865
866=item * exists()
867
d0b74c17 868Checks if a hash key or array index exists. Takes one argument: the hash key
ffed8b01 869or array index. Returns true if it exists, false if not.
870
a8fdabda 871 if ($db->exists("foo")) { print "yay!\n"; } # for hashes
872 if ($db->exists(1)) { print "yay!\n"; } # for arrays
ffed8b01 873
874=item * delete()
875
876Deletes one hash key/value pair or array element. Takes one argument: the hash
877key or array index. Returns true on success, false if not found. For arrays,
878the remaining elements located after the deleted element are NOT moved over.
879The deleted element is essentially just undefined, which is exactly how Perl's
d0b74c17 880internal arrays work. Please note that the space occupied by the deleted
881key/value or element is B<not> reused again -- see L<UNUSED SPACE RECOVERY>
ffed8b01 882below for details and workarounds.
883
a8fdabda 884 $db->delete("foo"); # for hashes
885 $db->delete(1); # for arrays
ffed8b01 886
887=item * clear()
888
d0b74c17 889Deletes B<all> hash keys or array elements. Takes no arguments. No return
890value. Please note that the space occupied by the deleted keys/values or
891elements is B<not> reused again -- see L<UNUSED SPACE RECOVERY> below for
ffed8b01 892details and workarounds.
893
a8fdabda 894 $db->clear(); # hashes or arrays
ffed8b01 895
4d35d856 896=item * lock() / unlock()
897
898q.v. Locking.
899
900=item * optimize()
901
eff6a245 902Recover lost disk space. This is important to do, especially if you use
903transactions.
4d35d856 904
905=item * import() / export()
906
907Data going in and out.
908
ffed8b01 909=back
910
911=head2 HASHES
912
d0b74c17 913For hashes, DBM::Deep supports all the common methods described above, and the
ffed8b01 914following additional methods: C<first_key()> and C<next_key()>.
915
916=over
917
918=item * first_key()
919
d0b74c17 920Returns the "first" key in the hash. As with built-in Perl hashes, keys are
921fetched in an undefined order (which appears random). Takes no arguments,
ffed8b01 922returns the key as a scalar value.
923
a8fdabda 924 my $key = $db->first_key();
ffed8b01 925
926=item * next_key()
927
928Returns the "next" key in the hash, given the previous one as the sole argument.
929Returns undef if there are no more keys to be fetched.
930
a8fdabda 931 $key = $db->next_key($key);
ffed8b01 932
933=back
934
935Here are some examples of using hashes:
936
a8fdabda 937 my $db = DBM::Deep->new( "foo.db" );
d0b74c17 938
a8fdabda 939 $db->put("foo", "bar");
940 print "foo: " . $db->get("foo") . "\n";
d0b74c17 941
a8fdabda 942 $db->put("baz", {}); # new child hash ref
943 $db->get("baz")->put("buz", "biz");
944 print "buz: " . $db->get("baz")->get("buz") . "\n";
d0b74c17 945
a8fdabda 946 my $key = $db->first_key();
947 while ($key) {
948 print "$key: " . $db->get($key) . "\n";
949 $key = $db->next_key($key);
950 }
d0b74c17 951
a8fdabda 952 if ($db->exists("foo")) { $db->delete("foo"); }
ffed8b01 953
954=head2 ARRAYS
955
d0b74c17 956For arrays, DBM::Deep supports all the common methods described above, and the
957following additional methods: C<length()>, C<push()>, C<pop()>, C<shift()>,
ffed8b01 958C<unshift()> and C<splice()>.
959
960=over
961
962=item * length()
963
964Returns the number of elements in the array. Takes no arguments.
965
a8fdabda 966 my $len = $db->length();
ffed8b01 967
968=item * push()
969
d0b74c17 970Adds one or more elements onto the end of the array. Accepts scalars, hash
ffed8b01 971refs or array refs. No return value.
972
a8fdabda 973 $db->push("foo", "bar", {});
ffed8b01 974
975=item * pop()
976
977Fetches the last element in the array, and deletes it. Takes no arguments.
978Returns undef if array is empty. Returns the element value.
979
a8fdabda 980 my $elem = $db->pop();
ffed8b01 981
982=item * shift()
983
d0b74c17 984Fetches the first element in the array, deletes it, then shifts all the
985remaining elements over to take up the space. Returns the element value. This
986method is not recommended with large arrays -- see L<LARGE ARRAYS> below for
ffed8b01 987details.
988
a8fdabda 989 my $elem = $db->shift();
ffed8b01 990
991=item * unshift()
992
d0b74c17 993Inserts one or more elements onto the beginning of the array, shifting all
994existing elements over to make room. Accepts scalars, hash refs or array refs.
995No return value. This method is not recommended with large arrays -- see
ffed8b01 996<LARGE ARRAYS> below for details.
997
a8fdabda 998 $db->unshift("foo", "bar", {});
ffed8b01 999
1000=item * splice()
1001
d0b74c17 1002Performs exactly like Perl's built-in function of the same name. See L<perldoc
ffed8b01 1003-f splice> for usage -- it is too complicated to document here. This method is
1004not recommended with large arrays -- see L<LARGE ARRAYS> below for details.
1005
1006=back
1007
1008Here are some examples of using arrays:
1009
a8fdabda 1010 my $db = DBM::Deep->new(
1011 file => "foo.db",
1012 type => DBM::Deep->TYPE_ARRAY
1013 );
d0b74c17 1014
a8fdabda 1015 $db->push("bar", "baz");
1016 $db->unshift("foo");
1017 $db->put(3, "buz");
d0b74c17 1018
a8fdabda 1019 my $len = $db->length();
1020 print "length: $len\n"; # 4
d0b74c17 1021
a8fdabda 1022 for (my $k=0; $k<$len; $k++) {
1023 print "$k: " . $db->get($k) . "\n";
1024 }
d0b74c17 1025
a8fdabda 1026 $db->splice(1, 2, "biz", "baf");
d0b74c17 1027
a8fdabda 1028 while (my $elem = shift @$db) {
1029 print "shifted: $elem\n";
1030 }
ffed8b01 1031
1032=head1 LOCKING
1033
d0b74c17 1034Enable automatic file locking by passing a true value to the C<locking>
ffed8b01 1035parameter when constructing your DBM::Deep object (see L<SETUP> above).
1036
a8fdabda 1037 my $db = DBM::Deep->new(
1038 file => "foo.db",
1039 locking => 1
1040 );
ffed8b01 1041
d0b74c17 1042This causes DBM::Deep to C<flock()> the underlying filehandle with exclusive
1043mode for writes, and shared mode for reads. This is required if you have
1044multiple processes accessing the same database file, to avoid file corruption.
1045Please note that C<flock()> does NOT work for files over NFS. See L<DB OVER
ffed8b01 1046NFS> below for more.
1047
1048=head2 EXPLICIT LOCKING
1049
d0b74c17 1050You can explicitly lock a database, so it remains locked for multiple
1051transactions. This is done by calling the C<lock()> method, and passing an
90f93b43 1052optional lock mode argument (defaults to exclusive mode). This is particularly
d0b74c17 1053useful for things like counters, where the current value needs to be fetched,
ffed8b01 1054then incremented, then stored again.
1055
a8fdabda 1056 $db->lock();
1057 my $counter = $db->get("counter");
1058 $counter++;
1059 $db->put("counter", $counter);
1060 $db->unlock();
d0b74c17 1061
a8fdabda 1062 # or...
ffed8b01 1063
a8fdabda 1064 $db->lock();
1065 $db->{counter}++;
1066 $db->unlock();
ffed8b01 1067
1068You can pass C<lock()> an optional argument, which specifies which mode to use
68f943b3 1069(exclusive or shared). Use one of these two constants:
1070C<DBM::Deep-E<gt>LOCK_EX> or C<DBM::Deep-E<gt>LOCK_SH>. These are passed
1071directly to C<flock()>, and are the same as the constants defined in Perl's
1072L<Fcntl/> module.
ffed8b01 1073
a8fdabda 1074 $db->lock( $db->LOCK_SH );
1075 # something here
1076 $db->unlock();
ffed8b01 1077
ffed8b01 1078=head1 IMPORTING/EXPORTING
1079
1080You can import existing complex structures by calling the C<import()> method,
1081and export an entire database into an in-memory structure using the C<export()>
1082method. Both are examined here.
1083
1084=head2 IMPORTING
1085
1086Say you have an existing hash with nested hashes/arrays inside it. Instead of
d0b74c17 1087walking the structure and adding keys/elements to the database as you go,
1088simply pass a reference to the C<import()> method. This recursively adds
ffed8b01 1089everything to an existing DBM::Deep object for you. Here is an example:
1090
a8fdabda 1091 my $struct = {
1092 key1 => "value1",
1093 key2 => "value2",
1094 array1 => [ "elem0", "elem1", "elem2" ],
1095 hash1 => {
1096 subkey1 => "subvalue1",
1097 subkey2 => "subvalue2"
1098 }
1099 };
d0b74c17 1100
a8fdabda 1101 my $db = DBM::Deep->new( "foo.db" );
1102 $db->import( $struct );
d0b74c17 1103
a8fdabda 1104 print $db->{key1} . "\n"; # prints "value1"
d0b74c17 1105
1106This recursively imports the entire C<$struct> object into C<$db>, including
ffed8b01 1107all nested hashes and arrays. If the DBM::Deep object contains exsiting data,
d0b74c17 1108keys are merged with the existing ones, replacing if they already exist.
1109The C<import()> method can be called on any database level (not just the base
ffed8b01 1110level), and works with both hash and array DB types.
1111
ffed8b01 1112B<Note:> Make sure your existing structure has no circular references in it.
eff6a245 1113These will cause an infinite loop when importing. There are plans to fix this
1114in a later release.
ffed8b01 1115
1116=head2 EXPORTING
1117
d0b74c17 1118Calling the C<export()> method on an existing DBM::Deep object will return
1119a reference to a new in-memory copy of the database. The export is done
ffed8b01 1120recursively, so all nested hashes/arrays are all exported to standard Perl
1121objects. Here is an example:
1122
a8fdabda 1123 my $db = DBM::Deep->new( "foo.db" );
d0b74c17 1124
a8fdabda 1125 $db->{key1} = "value1";
1126 $db->{key2} = "value2";
1127 $db->{hash1} = {};
1128 $db->{hash1}->{subkey1} = "subvalue1";
1129 $db->{hash1}->{subkey2} = "subvalue2";
d0b74c17 1130
a8fdabda 1131 my $struct = $db->export();
d0b74c17 1132
a8fdabda 1133 print $struct->{key1} . "\n"; # prints "value1"
ffed8b01 1134
1135This makes a complete copy of the database in memory, and returns a reference
d0b74c17 1136to it. The C<export()> method can be called on any database level (not just
1137the base level), and works with both hash and array DB types. Be careful of
1138large databases -- you can store a lot more data in a DBM::Deep object than an
ffed8b01 1139in-memory Perl structure.
1140
ffed8b01 1141B<Note:> Make sure your database has no circular references in it.
eff6a245 1142These will cause an infinite loop when exporting. There are plans to fix this
1143in a later release.
ffed8b01 1144
1145=head1 FILTERS
1146
1147DBM::Deep has a number of hooks where you can specify your own Perl function
1148to perform filtering on incoming or outgoing data. This is a perfect
1149way to extend the engine, and implement things like real-time compression or
d0b74c17 1150encryption. Filtering applies to the base DB level, and all child hashes /
1151arrays. Filter hooks can be specified when your DBM::Deep object is first
1152constructed, or by calling the C<set_filter()> method at any time. There are
ffed8b01 1153four available filter hooks, described below:
1154
1155=over
1156
1157=item * filter_store_key
1158
d0b74c17 1159This filter is called whenever a hash key is stored. It
ffed8b01 1160is passed the incoming key, and expected to return a transformed key.
1161
1162=item * filter_store_value
1163
d0b74c17 1164This filter is called whenever a hash key or array element is stored. It
ffed8b01 1165is passed the incoming value, and expected to return a transformed value.
1166
1167=item * filter_fetch_key
1168
d0b74c17 1169This filter is called whenever a hash key is fetched (i.e. via
ffed8b01 1170C<first_key()> or C<next_key()>). It is passed the transformed key,
1171and expected to return the plain key.
1172
1173=item * filter_fetch_value
1174
d0b74c17 1175This filter is called whenever a hash key or array element is fetched.
ffed8b01 1176It is passed the transformed value, and expected to return the plain value.
1177
1178=back
1179
1180Here are the two ways to setup a filter hook:
1181
a8fdabda 1182 my $db = DBM::Deep->new(
1183 file => "foo.db",
1184 filter_store_value => \&my_filter_store,
1185 filter_fetch_value => \&my_filter_fetch
1186 );
d0b74c17 1187
a8fdabda 1188 # or...
d0b74c17 1189
a8fdabda 1190 $db->set_filter( "filter_store_value", \&my_filter_store );
1191 $db->set_filter( "filter_fetch_value", \&my_filter_fetch );
ffed8b01 1192
1193Your filter function will be called only when dealing with SCALAR keys or
1194values. When nested hashes and arrays are being stored/fetched, filtering
d0b74c17 1195is bypassed. Filters are called as static functions, passed a single SCALAR
ffed8b01 1196argument, and expected to return a single SCALAR value. If you want to
1197remove a filter, set the function reference to C<undef>:
1198
a8fdabda 1199 $db->set_filter( "filter_store_value", undef );
ffed8b01 1200
1201=head2 REAL-TIME ENCRYPTION EXAMPLE
1202
d0b74c17 1203Here is a working example that uses the I<Crypt::Blowfish> module to
ffed8b01 1204do real-time encryption / decryption of keys & values with DBM::Deep Filters.
d0b74c17 1205Please visit L<http://search.cpan.org/search?module=Crypt::Blowfish> for more
ffed8b01 1206on I<Crypt::Blowfish>. You'll also need the I<Crypt::CBC> module.
1207
a8fdabda 1208 use DBM::Deep;
1209 use Crypt::Blowfish;
1210 use Crypt::CBC;
1211
1212 my $cipher = Crypt::CBC->new({
1213 'key' => 'my secret key',
1214 'cipher' => 'Blowfish',
1215 'iv' => '$KJh#(}q',
1216 'regenerate_key' => 0,
1217 'padding' => 'space',
1218 'prepend_iv' => 0
1219 });
1220
1221 my $db = DBM::Deep->new(
1222 file => "foo-encrypt.db",
1223 filter_store_key => \&my_encrypt,
1224 filter_store_value => \&my_encrypt,
1225 filter_fetch_key => \&my_decrypt,
1226 filter_fetch_value => \&my_decrypt,
1227 );
1228
1229 $db->{key1} = "value1";
1230 $db->{key2} = "value2";
1231 print "key1: " . $db->{key1} . "\n";
1232 print "key2: " . $db->{key2} . "\n";
1233
1234 undef $db;
1235 exit;
1236
1237 sub my_encrypt {
1238 return $cipher->encrypt( $_[0] );
1239 }
1240 sub my_decrypt {
1241 return $cipher->decrypt( $_[0] );
1242 }
ffed8b01 1243
1244=head2 REAL-TIME COMPRESSION EXAMPLE
1245
1246Here is a working example that uses the I<Compress::Zlib> module to do real-time
1247compression / decompression of keys & values with DBM::Deep Filters.
d0b74c17 1248Please visit L<http://search.cpan.org/search?module=Compress::Zlib> for
ffed8b01 1249more on I<Compress::Zlib>.
1250
a8fdabda 1251 use DBM::Deep;
1252 use Compress::Zlib;
1253
1254 my $db = DBM::Deep->new(
1255 file => "foo-compress.db",
1256 filter_store_key => \&my_compress,
1257 filter_store_value => \&my_compress,
1258 filter_fetch_key => \&my_decompress,
1259 filter_fetch_value => \&my_decompress,
1260 );
1261
1262 $db->{key1} = "value1";
1263 $db->{key2} = "value2";
1264 print "key1: " . $db->{key1} . "\n";
1265 print "key2: " . $db->{key2} . "\n";
1266
1267 undef $db;
1268 exit;
1269
1270 sub my_compress {
1271 return Compress::Zlib::memGzip( $_[0] ) ;
1272 }
1273 sub my_decompress {
1274 return Compress::Zlib::memGunzip( $_[0] ) ;
1275 }
ffed8b01 1276
1277B<Note:> Filtering of keys only applies to hashes. Array "keys" are
1278actually numerical index numbers, and are not filtered.
1279
1280=head1 ERROR HANDLING
1281
1282Most DBM::Deep methods return a true value for success, and call die() on
95967a5e 1283failure. You can wrap calls in an eval block to catch the die.
ffed8b01 1284
a8fdabda 1285 my $db = DBM::Deep->new( "foo.db" ); # create hash
1286 eval { $db->push("foo"); }; # ILLEGAL -- push is array-only call
d0b74c17 1287
a8fdabda 1288 print $@; # prints error message
429e4192 1289
ffed8b01 1290=head1 LARGEFILE SUPPORT
1291
1292If you have a 64-bit system, and your Perl is compiled with both LARGEFILE
1293and 64-bit support, you I<may> be able to create databases larger than 2 GB.
1294DBM::Deep by default uses 32-bit file offset tags, but these can be changed
044e6288 1295by specifying the 'pack_size' parameter when constructing the file.
ffed8b01 1296
a8fdabda 1297 DBM::Deep->new(
1298 filename => $filename,
1299 pack_size => 'large',
1300 );
ffed8b01 1301
d0b74c17 1302This tells DBM::Deep to pack all file offsets with 8-byte (64-bit) quad words
1303instead of 32-bit longs. After setting these values your DB files have a
ffed8b01 1304theoretical maximum size of 16 XB (exabytes).
1305
044e6288 1306You can also use C<pack_size =E<gt> 'small'> in order to use 16-bit file
1307offsets.
1308
ffed8b01 1309B<Note:> Changing these values will B<NOT> work for existing database files.
044e6288 1310Only change this for new files. Once the value has been set, it is stored in
1311the file's header and cannot be changed for the life of the file. These
1312parameters are per-file, meaning you can access 32-bit and 64-bit files, as
1313you chose.
ffed8b01 1314
044e6288 1315B<Note:> We have not personally tested files larger than 2 GB -- all my
1316systems have only a 32-bit Perl. However, I have received user reports that
1317this does indeed work!
ffed8b01 1318
1319=head1 LOW-LEVEL ACCESS
1320
90f93b43 1321If you require low-level access to the underlying filehandle that DBM::Deep uses,
4d35d856 1322you can call the C<_fh()> method, which returns the handle:
ffed8b01 1323
a8fdabda 1324 my $fh = $db->_fh();
ffed8b01 1325
1326This method can be called on the root level of the datbase, or any child
1327hashes or arrays. All levels share a I<root> structure, which contains things
90f93b43 1328like the filehandle, a reference counter, and all the options specified
460b1067 1329when you created the object. You can get access to this file object by
83371fe3 1330calling the C<_storage()> method.
ffed8b01 1331
83371fe3 1332 my $file_obj = $db->_storage();
ffed8b01 1333
1334This is useful for changing options after the object has already been created,
f5be9b03 1335such as enabling/disabling locking. You can also store your own temporary user
1336data in this structure (be wary of name collision), which is then accessible from
1337any child hash or array.
ffed8b01 1338
1339=head1 CUSTOM DIGEST ALGORITHM
1340
1341DBM::Deep by default uses the I<Message Digest 5> (MD5) algorithm for hashing
1342keys. However you can override this, and use another algorithm (such as SHA-256)
d0b74c17 1343or even write your own. But please note that DBM::Deep currently expects zero
044e6288 1344collisions, so your algorithm has to be I<perfect>, so to speak. Collision
1345detection may be introduced in a later version.
ffed8b01 1346
044e6288 1347You can specify a custom digest algorithm by passing it into the parameter
1348list for new(), passing a reference to a subroutine as the 'digest' parameter,
1349and the length of the algorithm's hashes (in bytes) as the 'hash_size'
1350parameter. Here is a working example that uses a 256-bit hash from the
d0b74c17 1351I<Digest::SHA256> module. Please see
044e6288 1352L<http://search.cpan.org/search?module=Digest::SHA256> for more information.
ffed8b01 1353
a8fdabda 1354 use DBM::Deep;
1355 use Digest::SHA256;
d0b74c17 1356
a8fdabda 1357 my $context = Digest::SHA256::new(256);
d0b74c17 1358
a8fdabda 1359 my $db = DBM::Deep->new(
1360 filename => "foo-sha.db",
1361 digest => \&my_digest,
1362 hash_size => 32,
1363 );
d0b74c17 1364
a8fdabda 1365 $db->{key1} = "value1";
1366 $db->{key2} = "value2";
1367 print "key1: " . $db->{key1} . "\n";
1368 print "key2: " . $db->{key2} . "\n";
d0b74c17 1369
a8fdabda 1370 undef $db;
1371 exit;
d0b74c17 1372
a8fdabda 1373 sub my_digest {
1374 return substr( $context->hash($_[0]), 0, 32 );
1375 }
ffed8b01 1376
1377B<Note:> Your returned digest strings must be B<EXACTLY> the number
044e6288 1378of bytes you specify in the hash_size parameter (in this case 32).
ffed8b01 1379
260a80b4 1380B<Note:> If you do choose to use a custom digest algorithm, you must set it
1381every time you access this file. Otherwise, the default (MD5) will be used.
1382
ffed8b01 1383=head1 CIRCULAR REFERENCES
1384
1385DBM::Deep has B<experimental> support for circular references. Meaning you
1386can have a nested hash key or array element that points to a parent object.
1387This relationship is stored in the DB file, and is preserved between sessions.
1388Here is an example:
1389
a8fdabda 1390 my $db = DBM::Deep->new( "foo.db" );
d0b74c17 1391
a8fdabda 1392 $db->{foo} = "bar";
1393 $db->{circle} = $db; # ref to self
d0b74c17 1394
a8fdabda 1395 print $db->{foo} . "\n"; # prints "bar"
1396 print $db->{circle}->{foo} . "\n"; # prints "bar" again
ffed8b01 1397
69c94980 1398B<Note>: Passing the object to a function that recursively walks the
ffed8b01 1399object tree (such as I<Data::Dumper> or even the built-in C<optimize()> or
69c94980 1400C<export()> methods) will result in an infinite loop. This will be fixed in
1401a future release.
ffed8b01 1402
eff6a245 1403=head1 TRANSACTIONS
1404
1405New in 0.99_01 is ACID transactions. Every DBM::Deep object is completely
1406transaction-ready - it is not an option you have to turn on. Three new methods
1407have been added to support them. They are:
1408
1409=over 4
1410
1411=item * begin_work()
1412
1413This starts a transaction.
1414
1415=item * commit()
1416
1417This applies the changes done within the transaction to the mainline and ends
1418the transaction.
1419
1420=item * rollback()
1421
1422This discards the changes done within the transaction to the mainline and ends
1423the transaction.
1424
1425=back
1426
1427Transactions in DBM::Deep are done using the MVCC method, the same method used
1428by the InnoDB MySQL table type.
1429
ffed8b01 1430=head1 CAVEATS / ISSUES / BUGS
1431
1432This section describes all the known issues with DBM::Deep. It you have found
1433something that is not listed here, please send e-mail to L<jhuckaby@cpan.org>.
1434
1435=head2 UNUSED SPACE RECOVERY
1436
14a3acb6 1437One major caveat with DBM::Deep is that space occupied by existing keys and
ffed8b01 1438values is not recovered when they are deleted. Meaning if you keep deleting
1439and adding new keys, your file will continuously grow. I am working on this,
d0b74c17 1440but in the meantime you can call the built-in C<optimize()> method from time to
ffed8b01 1441time (perhaps in a crontab or something) to recover all your unused space.
1442
a8fdabda 1443 $db->optimize(); # returns true on success
ffed8b01 1444
1445This rebuilds the ENTIRE database into a new file, then moves it on top of
1446the original. The new file will have no unused space, thus it will take up as
d0b74c17 1447little disk space as possible. Please note that this operation can take
1448a long time for large files, and you need enough disk space to temporarily hold
14492 copies of your DB file. The temporary file is created in the same directory
1450as the original, named with a ".tmp" extension, and is deleted when the
1451operation completes. Oh, and if locking is enabled, the DB is automatically
ffed8b01 1452locked for the entire duration of the copy.
1453
d0b74c17 1454B<WARNING:> Only call optimize() on the top-level node of the database, and
1455make sure there are no child references lying around. DBM::Deep keeps a reference
ffed8b01 1456counter, and if it is greater than 1, optimize() will abort and return undef.
1457
eea0d863 1458=head2 REFERENCES
1459
1460(The reasons given assume a high level of Perl understanding, specifically of
1461references. You can safely skip this section.)
1462
1463Currently, the only references supported are HASH and ARRAY. The other reference
1464types (SCALAR, CODE, GLOB, and REF) cannot be supported for various reasons.
1465
1466=over 4
1467
1468=item * GLOB
1469
1470These are things like filehandles and other sockets. They can't be supported
1471because it's completely unclear how DBM::Deep should serialize them.
1472
1473=item * SCALAR / REF
1474
1475The discussion here refers to the following type of example:
1476
1477 my $x = 25;
1478 $db->{key1} = \$x;
1479
1480 $x = 50;
1481
1482 # In some other process ...
1483
1484 my $val = ${ $db->{key1} };
1485
1486 is( $val, 50, "What actually gets stored in the DB file?" );
1487
1488The problem is one of synchronization. When the variable being referred to
1489changes value, the reference isn't notified. This means that the new value won't
1490be stored in the datafile for other processes to read. There is no TIEREF.
1491
1492It is theoretically possible to store references to values already within a
1493DBM::Deep object because everything already is synchronized, but the change to
1494the internals would be quite large. Specifically, DBM::Deep would have to tie
1495every single value that is stored. This would bloat the RAM footprint of
1496DBM::Deep at least twofold (if not more) and be a significant performance drain,
1497all to support a feature that has never been requested.
1498
1499=item * CODE
1500
1990c72d 1501L<Data::Dump::Streamer/> provides a mechanism for serializing coderefs,
1502including saving off all closure state. However, just as for SCALAR and REF,
1503that closure state may change without notifying the DBM::Deep object storing
1504the reference.
eea0d863 1505
1506=back
1507
ffed8b01 1508=head2 FILE CORRUPTION
1509
14a3acb6 1510The current level of error handling in DBM::Deep is minimal. Files I<are> checked
1511for a 32-bit signature when opened, but other corruption in files can cause
1512segmentation faults. DBM::Deep may try to seek() past the end of a file, or get
ffed8b01 1513stuck in an infinite loop depending on the level of corruption. File write
1514operations are not checked for failure (for speed), so if you happen to run
d0b74c17 1515out of disk space, DBM::Deep will probably fail in a bad way. These things will
ffed8b01 1516be addressed in a later version of DBM::Deep.
1517
1518=head2 DB OVER NFS
1519
d8db2929 1520Beware of using DBM::Deep files over NFS. DBM::Deep uses flock(), which works
1521well on local filesystems, but will NOT protect you from file corruption over
1522NFS. I've heard about setting up your NFS server with a locking daemon, then
1523using lockf() to lock your files, but your mileage may vary there as well.
1524From what I understand, there is no real way to do it. However, if you need
1525access to the underlying filehandle in DBM::Deep for using some other kind of
1526locking scheme like lockf(), see the L<LOW-LEVEL ACCESS> section above.
ffed8b01 1527
1528=head2 COPYING OBJECTS
1529
d0b74c17 1530Beware of copying tied objects in Perl. Very strange things can happen.
1531Instead, use DBM::Deep's C<clone()> method which safely copies the object and
ffed8b01 1532returns a new, blessed, tied hash or array to the same level in the DB.
1533
a8fdabda 1534 my $copy = $db->clone();
ffed8b01 1535
90f93b43 1536B<Note>: Since clone() here is cloning the object, not the database location, any
d8db2929 1537modifications to either $db or $copy will be visible to both.
90f93b43 1538
ffed8b01 1539=head2 LARGE ARRAYS
1540
1541Beware of using C<shift()>, C<unshift()> or C<splice()> with large arrays.
1542These functions cause every element in the array to move, which can be murder
1543on DBM::Deep, as every element has to be fetched from disk, then stored again in
90f93b43 1544a different location. This will be addressed in the forthcoming version 1.00.
ffed8b01 1545
9be51a89 1546=head2 WRITEONLY FILES
1547
1548If you pass in a filehandle to new(), you may have opened it in either a readonly or
1549writeonly mode. STORE will verify that the filehandle is writable. However, there
1550doesn't seem to be a good way to determine if a filehandle is readable. And, if the
1551filehandle isn't readable, it's not clear what will happen. So, don't do that.
1552
261d1296 1553=head1 CODE COVERAGE
1554
eff6a245 1555B<Devel::Cover> is used to test the code coverage of the tests. Below is the
1556B<Devel::Cover> report on this distribution's test suite.
7910cf68 1557
eff6a245 1558 ---------------------------- ------ ------ ------ ------ ------ ------ ------
1559 File stmt bran cond sub pod time total
1560 ---------------------------- ------ ------ ------ ------ ------ ------ ------
1561 blib/lib/DBM/Deep.pm 96.2 89.0 75.0 95.8 89.5 36.0 92.9
1562 blib/lib/DBM/Deep/Array.pm 96.1 88.3 100.0 96.4 100.0 15.9 94.7
1563 blib/lib/DBM/Deep/Engine.pm 96.6 86.6 89.5 100.0 0.0 20.0 91.0
1564 blib/lib/DBM/Deep/File.pm 99.4 88.3 55.6 100.0 0.0 19.6 89.5
1565 blib/lib/DBM/Deep/Hash.pm 98.5 83.3 100.0 100.0 100.0 8.5 96.3
1566 Total 96.9 87.4 81.2 98.0 38.5 100.0 92.1
1567 ---------------------------- ------ ------ ------ ------ ------ ------ ------
37c5bcf0 1568
1569=head1 MORE INFORMATION
1570
1571Check out the DBM::Deep Google Group at L<http://groups.google.com/group/DBM-Deep>
eff6a245 1572or send email to L<DBM-Deep@googlegroups.com>. You can also visit #dbm-deep on
1573irc.perl.org
ffed8b01 1574
d8db2929 1575The source code repository is at L<http://svn.perl.org/modules/DBM-Deep>
1576
eff6a245 1577=head1 MAINTAINERS
37c5bcf0 1578
aeeb5497 1579Rob Kinyon, L<rkinyon@cpan.org>
ffed8b01 1580
eff6a245 1581Originally written by Joseph Huckaby, L<jhuckaby@cpan.org>
1582
ffed8b01 1583Special thanks to Adam Sah and Rich Gaushell! You know why :-)
1584
1585=head1 SEE ALSO
1586
1587perltie(1), Tie::Hash(3), Digest::MD5(3), Fcntl(3), flock(2), lockf(3), nfs(5),
1588Digest::SHA256(3), Crypt::Blowfish(3), Compress::Zlib(3)
1589
1590=head1 LICENSE
1591
aeeb5497 1592Copyright (c) 2002-2006 Joseph Huckaby. All Rights Reserved.
ffed8b01 1593This is free software, you may use it and distribute it under the
1594same terms as Perl itself.
1595
1596=cut