ext/DB_File/DB_File.pm

   1 # DB_File.pm -- Perl 5 interface to Berkeley DB
   2 #
   3 # written by Paul Marquess (Paul.Marquess@btinternet.com)
   4 # last modified 1st March 2002
   5 # version 1.804
   6 #
   7 #     Copyright (c) 1995-2002 Paul Marquess. All rights reserved.
   8 #     This program is free software; you can redistribute it and/or
   9 #     modify it under the same terms as Perl itself.
  10
  11
  12 package DB_File::HASHINFO ;
  13
  14 require 5.00404;
  15
  16 use warnings;
  17 use strict;
  18 use Carp;
  19 require Tie::Hash;
  20 @DB_File::HASHINFO::ISA = qw(Tie::Hash);
  21
  22 sub new
  23 {
  24     my $pkg = shift ;
  25     my %x ;
  26     tie %x, $pkg ;
  27     bless \%x, $pkg ;
  28 }
  29
  30
  31 sub TIEHASH
  32 {
  33     my $pkg = shift ;
  34
  35     bless { VALID => { map {$_, 1}
  36                        qw( bsize ffactor nelem cachesize hash lorder)
  37                      },
  38             GOT   => {}
  39           }, $pkg ;
  40 }
  41
  42
  43 sub FETCH
  44 {
  45     my $self  = shift ;
  46     my $key   = shift ;
  47
  48     return $self->{GOT}{$key} if exists $self->{VALID}{$key}  ;
  49
  50     my $pkg = ref $self ;
  51     croak "${pkg}::FETCH - Unknown element '$key'" ;
  52 }
  53
  54
  55 sub STORE
  56 {
  57     my $self  = shift ;
  58     my $key   = shift ;
  59     my $value = shift ;
  60
  61     if ( exists $self->{VALID}{$key} )
  62     {
  63         $self->{GOT}{$key} = $value ;
  64         return ;
  65     }
  66
  67     my $pkg = ref $self ;
  68     croak "${pkg}::STORE - Unknown element '$key'" ;
  69 }
  70
  71 sub DELETE
  72 {
  73     my $self = shift ;
  74     my $key  = shift ;
  75
  76     if ( exists $self->{VALID}{$key} )
  77     {
  78         delete $self->{GOT}{$key} ;
  79         return ;
  80     }
  81
  82     my $pkg = ref $self ;
  83     croak "DB_File::HASHINFO::DELETE - Unknown element '$key'" ;
  84 }
  85
  86 sub EXISTS
  87 {
  88     my $self = shift ;
  89     my $key  = shift ;
  90
  91     exists $self->{VALID}{$key} ;
  92 }
  93
  94 sub NotHere
  95 {
  96     my $self = shift ;
  97     my $method = shift ;
  98
  99     croak ref($self) . " does not define the method ${method}" ;
 100 }
 101
 102 sub FIRSTKEY { my $self = shift ; $self->NotHere("FIRSTKEY") }
 103 sub NEXTKEY  { my $self = shift ; $self->NotHere("NEXTKEY") }
 104 sub CLEAR    { my $self = shift ; $self->NotHere("CLEAR") }
 105
 106 package DB_File::RECNOINFO ;
 107
 108 use warnings;
 109 use strict ;
 110
 111 @DB_File::RECNOINFO::ISA = qw(DB_File::HASHINFO) ;
 112
 113 sub TIEHASH
 114 {
 115     my $pkg = shift ;
 116
 117     bless { VALID => { map {$_, 1}
 118                        qw( bval cachesize psize flags lorder reclen bfname )
 119                      },
 120             GOT   => {},
 121           }, $pkg ;
 122 }
 123
 124 package DB_File::BTREEINFO ;
 125
 126 use warnings;
 127 use strict ;
 128
 129 @DB_File::BTREEINFO::ISA = qw(DB_File::HASHINFO) ;
 130
 131 sub TIEHASH
 132 {
 133     my $pkg = shift ;
 134
 135     bless { VALID => { map {$_, 1}
 136                        qw( flags cachesize maxkeypage minkeypage psize
 137                            compare prefix lorder )
 138                      },
 139             GOT   => {},
 140           }, $pkg ;
 141 }
 142
 143
 144 package DB_File ;
 145
 146 use warnings;
 147 use strict;
 148 our ($VERSION, @ISA, @EXPORT, $AUTOLOAD, $DB_BTREE, $DB_HASH, $DB_RECNO);
 149 our ($db_version, $use_XSLoader, $splice_end_array);
 150 use Carp;
 151
 152
 153 $VERSION = "1.804" ;
 154
 155 {
 156     local $SIG{__WARN__} = sub {$splice_end_array = "@_";};
 157     my @a =(1); splice(@a, 3);
 158     $splice_end_array =
 159         ($splice_end_array =~ /^splice\(\) offset past end of array at /);
 160 }
 161
 162 #typedef enum { DB_BTREE, DB_HASH, DB_RECNO } DBTYPE;
 163 $DB_BTREE = new DB_File::BTREEINFO ;
 164 $DB_HASH  = new DB_File::HASHINFO ;
 165 $DB_RECNO = new DB_File::RECNOINFO ;
 166
# Tie::Hash and Exporter are added to @ISA further down, so both are
# loaded here.
require Tie::Hash;
require Exporter;
use AutoLoader;
BEGIN {
    # Prefer XSLoader.  $use_XSLoader records the choice for the code
    # that loads the compiled part of the module later on.
    $use_XSLoader = 1 ;
    # $SIG{__DIE__} is localised so that a die handler installed by the
    # calling program is not run if XSLoader cannot be loaded.
    { local $SIG{__DIE__} ; eval { require XSLoader } ; }

    # XSLoader could not be loaded: fall back to DynaLoader, which has to
    # be a base class for the bootstrap method to be found.
    if ($@) {
        $use_XSLoader = 0 ;
        require DynaLoader;
        @ISA = qw(DynaLoader);
    }
}

# push, not assignment: @ISA may already hold DynaLoader (see BEGIN).
push @ISA, qw(Tie::Hash Exporter);
# Names exported by default: the three predefined option objects followed
# by constants, which AUTOLOAD resolves on first use.
@EXPORT = qw(
        $DB_BTREE $DB_HASH $DB_RECNO

        BTREEMAGIC
        BTREEVERSION
        DB_LOCK
        DB_SHMEM
        DB_TXN
        HASHMAGIC
        HASHVERSION
        MAX_PAGE_NUMBER
        MAX_PAGE_OFFSET
        MAX_REC_NUMBER
        RET_ERROR
        RET_SPECIAL
        RET_SUCCESS
        R_CURSOR
        R_DUP
        R_FIRST
        R_FIXEDLEN
        R_IAFTER
        R_IBEFORE
        R_LAST
        R_NEXT
        R_NOKEY
        R_NOOVERWRITE
        R_PREV
        R_RECNOSYNC
        R_SETCURSOR
        R_SNAPSHOT
        __R_UNUSED

);
 215
 216 sub AUTOLOAD {
 217     my($constname);
 218     ($constname = $AUTOLOAD) =~ s/.*:://;
 219     my ($error, $val) = constant($constname);
 220     Carp::croak $error if $error;
 221     no strict 'refs';
 222     *{$AUTOLOAD} = sub { $val };
 223     goto &{$AUTOLOAD};
 224 }
 225
 226
 227 eval {
 228     # Make all Fcntl O_XXX constants available for importing
 229     require Fcntl;
 230     my @O = grep /^O_/, @Fcntl::EXPORT;
 231     Fcntl->import(@O);  # first we import what we want to export
 232     push(@EXPORT, @O);
 233 };
 234
 235 if ($use_XSLoader)
 236   { XSLoader::load("DB_File", $VERSION)}
 237 else
 238   { bootstrap DB_File $VERSION }
 239
 240 # Preloaded methods go here.  Autoload methods go after __END__, and are
 241 # processed by the autosplit program.
 242
 243 sub tie_hash_or_array
 244 {
 245     my (@arg) = @_ ;
 246     my $tieHASH = ( (caller(1))[3] =~ /TIEHASH/ ) ;
 247
 248     $arg[4] = tied %{ $arg[4] }
 249         if @arg >= 5 && ref $arg[4] && $arg[4] =~ /=HASH/ && tied %{ $arg[4] } ;
 250
 251     # make recno in Berkeley DB version 2 work like recno in version 1.
 252     if ($db_version > 1 and defined $arg[4] and $arg[4] =~ /RECNO/ and
 253         $arg[1] and ! -e $arg[1]) {
 254         open(FH, ">$arg[1]") or return undef ;
 255         close FH ;
 256         chmod $arg[3] ? $arg[3] : 0666 , $arg[1] ;
 257     }
 258
 259     DoTie_($tieHASH, @arg) ;
 260 }
 261
 262 sub TIEHASH
 263 {
 264     tie_hash_or_array(@_) ;
 265 }
 266
 267 sub TIEARRAY
 268 {
 269     tie_hash_or_array(@_) ;
 270 }
 271
 272 sub CLEAR
 273 {
 274     my $self = shift;
 275     my $key = 0 ;
 276     my $value = "" ;
 277     my $status = $self->seq($key, $value, R_FIRST());
 278     my @keys;
 279
 280     while ($status == 0) {
 281         push @keys, $key;
 282         $status = $self->seq($key, $value, R_NEXT());
 283     }
 284     foreach $key (reverse @keys) {
 285         my $s = $self->del($key);
 286     }
 287 }
 288
 289 sub EXTEND { }
 290
 291 sub STORESIZE
 292 {
 293     my $self = shift;
 294     my $length = shift ;
 295     my $current_length = $self->length() ;
 296
 297     if ($length < $current_length) {
 298         my $key ;
 299         for ($key = $current_length - 1 ; $key >= $length ; -- $key)
 300           { $self->del($key) }
 301     }
 302     elsif ($length > $current_length) {
 303         $self->put($length-1, "") ;
 304     }
 305 }
 306
 307
 308 sub SPLICE
 309 {
 310     my $self = shift;
 311     my $offset = shift;
 312     if (not defined $offset) {
 313         warnings::warnif('uninitialized', 'Use of uninitialized value in splice');
 314         $offset = 0;
 315     }
 316
 317     my $length = @_ ? shift : 0;
 318     # Carping about definedness comes _after_ the OFFSET sanity check.
 319     # This is so we get the same error messages as Perl's splice().
 320     #
 321
 322     my @list = @_;
 323
 324     my $size = $self->FETCHSIZE();
 325
 326     # 'If OFFSET is negative then it start that far from the end of
 327     # the array.'
 328     #
 329     if ($offset < 0) {
 330         my $new_offset = $size + $offset;
 331         if ($new_offset < 0) {
 332             die "Modification of non-creatable array value attempted, "
 333               . "subscript $offset";
 334         }
 335         $offset = $new_offset;
 336     }
 337
 338     if (not defined $length) {
 339         warnings::warnif('uninitialized', 'Use of uninitialized value in splice');
 340         $length = 0;
 341     }
 342
 343     if ($offset > $size) {
 344         $offset = $size;
 345         warnings::warnif('misc', 'splice() offset past end of array')
 346             if $splice_end_array;
 347     }
 348
 349     # 'If LENGTH is omitted, removes everything from OFFSET onward.'
 350     if (not defined $length) {
 351         $length = $size - $offset;
 352     }
 353
 354     # 'If LENGTH is negative, leave that many elements off the end of
 355     # the array.'
 356     #
 357     if ($length < 0) {
 358         $length = $size - $offset + $length;
 359
 360         if ($length < 0) {
 361             # The user must have specified a length bigger than the
 362             # length of the array passed in.  But perl's splice()
 363             # doesn't catch this, it just behaves as for length=0.
 364             #
 365             $length = 0;
 366         }
 367     }
 368
 369     if ($length > $size - $offset) {
 370         $length = $size - $offset;
 371     }
 372
 373     # $num_elems holds the current number of elements in the database.
 374     my $num_elems = $size;
 375
 376     # 'Removes the elements designated by OFFSET and LENGTH from an
 377     # array,'...
 378     #
 379     my @removed = ();
 380     foreach (0 .. $length - 1) {
 381         my $old;
 382         my $status = $self->get($offset, $old);
 383         if ($status != 0) {
 384             my $msg = "error from Berkeley DB on get($offset, \$old)";
 385             if ($status == 1) {
 386                 $msg .= ' (no such element?)';
 387             }
 388             else {
 389                 $msg .= ": error status $status";
 390                 if (defined $! and $! ne '') {
 391                     $msg .= ", message $!";
 392                 }
 393             }
 394             die $msg;
 395         }
 396         push @removed, $old;
 397
 398         $status = $self->del($offset);
 399         if ($status != 0) {
 400             my $msg = "error from Berkeley DB on del($offset)";
 401             if ($status == 1) {
 402                 $msg .= ' (no such element?)';
 403             }
 404             else {
 405                 $msg .= ": error status $status";
 406                 if (defined $! and $! ne '') {
 407                     $msg .= ", message $!";
 408                 }
 409             }
 410             die $msg;
 411         }
 412
 413         -- $num_elems;
 414     }
 415
 416     # ...'and replaces them with the elements of LIST, if any.'
 417     my $pos = $offset;
 418     while (defined (my $elem = shift @list)) {
 419         my $old_pos = $pos;
 420         my $status;
 421         if ($pos >= $num_elems) {
 422             $status = $self->put($pos, $elem);
 423         }
 424         else {
 425             $status = $self->put($pos, $elem, $self->R_IBEFORE);
 426         }
 427
 428         if ($status != 0) {
 429             my $msg = "error from Berkeley DB on put($pos, $elem, ...)";
 430             if ($status == 1) {
 431                 $msg .= ' (no such element?)';
 432             }
 433             else {
 434                 $msg .= ", error status $status";
 435                 if (defined $! and $! ne '') {
 436                     $msg .= ", message $!";
 437                 }
 438             }
 439             die $msg;
 440         }
 441
 442         die "pos unexpectedly changed from $old_pos to $pos with R_IBEFORE"
 443           if $old_pos != $pos;
 444
 445         ++ $pos;
 446         ++ $num_elems;
 447     }
 448
 449     if (wantarray) {
 450         # 'In list context, returns the elements removed from the
 451         # array.'
 452         #
 453         return @removed;
 454     }
 455     elsif (defined wantarray and not wantarray) {
 456         # 'In scalar context, returns the last element removed, or
 457         # undef if no elements are removed.'
 458         #
 459         if (@removed) {
 460             my $last = pop @removed;
 461             return "$last";
 462         }
 463         else {
 464             return undef;
 465         }
 466     }
 467     elsif (not defined wantarray) {
 468         # Void context
 469     }
 470     else { die }
 471 }
 472 sub ::DB_File::splice { &SPLICE }
 473
 474 sub find_dup
 475 {
 476     croak "Usage: \$db->find_dup(key,value)\n"
 477         unless @_ == 3 ;
 478
 479     my $db        = shift ;
 480     my ($origkey, $value_wanted) = @_ ;
 481     my ($key, $value) = ($origkey, 0);
 482     my ($status) = 0 ;
 483
 484     for ($status = $db->seq($key, $value, R_CURSOR() ) ;
 485          $status == 0 ;
 486          $status = $db->seq($key, $value, R_NEXT() ) ) {
 487
 488         return 0 if $key eq $origkey and $value eq $value_wanted ;
 489     }
 490
 491     return $status ;
 492 }
 493
 494 sub del_dup
 495 {
 496     croak "Usage: \$db->del_dup(key,value)\n"
 497         unless @_ == 3 ;
 498
 499     my $db        = shift ;
 500     my ($key, $value) = @_ ;
 501     my ($status) = $db->find_dup($key, $value) ;
 502     return $status if $status != 0 ;
 503
 504     $status = $db->del($key, R_CURSOR() ) ;
 505     return $status ;
 506 }
 507
 508 sub get_dup
 509 {
 510     croak "Usage: \$db->get_dup(key [,flag])\n"
 511         unless @_ == 2 or @_ == 3 ;
 512
 513     my $db        = shift ;
 514     my $key       = shift ;
 515     my $flag      = shift ;
 516     my $value     = 0 ;
 517     my $origkey   = $key ;
 518     my $wantarray = wantarray ;
 519     my %values    = () ;
 520     my @values    = () ;
 521     my $counter   = 0 ;
 522     my $status    = 0 ;
 523
 524     # iterate through the database until either EOF ($status == 0)
 525     # or a different key is encountered ($key ne $origkey).
 526     for ($status = $db->seq($key, $value, R_CURSOR()) ;
 527          $status == 0 and $key eq $origkey ;
 528          $status = $db->seq($key, $value, R_NEXT()) ) {
 529
 530         # save the value or count number of matches
 531         if ($wantarray) {
 532             if ($flag)
 533                 { ++ $values{$value} }
 534             else
 535                 { push (@values, $value) }
 536         }
 537         else
 538             { ++ $counter }
 539
 540     }
 541
 542     return ($wantarray ? ($flag ? %values : @values) : $counter) ;
 543 }
 544
 545
 546 1;
 547 __END__
 548
 549 =head1 NAME
 550
 551 DB_File - Perl5 access to Berkeley DB version 1.x
 552
 553 =head1 SYNOPSIS
 554
 555  use DB_File;
 556
 557  [$X =] tie %hash,  'DB_File', [$filename, $flags, $mode, $DB_HASH] ;
 558  [$X =] tie %hash,  'DB_File', $filename, $flags, $mode, $DB_BTREE ;
 559  [$X =] tie @array, 'DB_File', $filename, $flags, $mode, $DB_RECNO ;
 560
 561  $status = $X->del($key [, $flags]) ;
 562  $status = $X->put($key, $value [, $flags]) ;
 563  $status = $X->get($key, $value [, $flags]) ;
 564  $status = $X->seq($key, $value, $flags) ;
 565  $status = $X->sync([$flags]) ;
 566  $status = $X->fd ;
 567
 568  # BTREE only
 569  $count = $X->get_dup($key) ;
 570  @list  = $X->get_dup($key) ;
 571  %list  = $X->get_dup($key, 1) ;
 572  $status = $X->find_dup($key, $value) ;
 573  $status = $X->del_dup($key, $value) ;
 574
 575  # RECNO only
 576  $a = $X->length;
 577  $a = $X->pop ;
 578  $X->push(list);
 579  $a = $X->shift;
 580  $X->unshift(list);
 581  @r = $X->splice(offset, length, elements);
 582
 583  # DBM Filters
 584  $old_filter = $db->filter_store_key  ( sub { ... } ) ;
 585  $old_filter = $db->filter_store_value( sub { ... } ) ;
 586  $old_filter = $db->filter_fetch_key  ( sub { ... } ) ;
 587  $old_filter = $db->filter_fetch_value( sub { ... } ) ;
 588
 589  untie %hash ;
 590  untie @array ;
 591
 592 =head1 DESCRIPTION
 593
 594 B<DB_File> is a module which allows Perl programs to make use of the
 595 facilities provided by Berkeley DB version 1.x (if you have a newer
 596 version of DB, see L<Using DB_File with Berkeley DB version 2 or greater>).
 597 It is assumed that you have a copy of the Berkeley DB manual pages at
 598 hand when reading this documentation. The interface defined here
 599 mirrors the Berkeley DB interface closely.
 600
 601 Berkeley DB is a C library which provides a consistent interface to a
 602 number of database formats.  B<DB_File> provides an interface to all
 603 three of the database types currently supported by Berkeley DB.
 604
 605 The file types are:
 606
 607 =over 5
 608
 609 =item B<DB_HASH>
 610
 611 This database type allows arbitrary key/value pairs to be stored in data
 612 files. This is equivalent to the functionality provided by other
 613 hashing packages like DBM, NDBM, ODBM, GDBM, and SDBM. Remember though,
 614 the files created using DB_HASH are not compatible with any of the
 615 other packages mentioned.
 616
 617 A default hashing algorithm, which will be adequate for most
 618 applications, is built into Berkeley DB. If you do need to use your own
 619 hashing algorithm it is possible to write your own in Perl and have
 620 B<DB_File> use it instead.
 621
 622 =item B<DB_BTREE>
 623
 624 The btree format allows arbitrary key/value pairs to be stored in a
 625 sorted, balanced binary tree.
 626
 627 As with the DB_HASH format, it is possible to provide a user defined
 628 Perl routine to perform the comparison of keys. By default, though, the
 629 keys are stored in lexical order.
 630
 631 =item B<DB_RECNO>
 632
 633 DB_RECNO allows both fixed-length and variable-length flat text files
 634 to be manipulated using the same key/value pair interface as in DB_HASH
 635 and DB_BTREE.  In this case the key will consist of a record (line)
 636 number.
 637
 638 =back
 639
 640 =head2 Using DB_File with Berkeley DB version 2 or greater
 641
 642 Although B<DB_File> is intended to be used with Berkeley DB version 1,
 643 it can also be used with version 2, 3 or 4. In this case the interface is
 644 limited to the functionality provided by Berkeley DB 1.x. Anywhere the
 645 version 2 or greater interface differs, B<DB_File> arranges for it to work
 646 like version 1. This feature allows B<DB_File> scripts that were built
 647 with version 1 to be migrated to version 2 or greater without any changes.
 648
 649 If you want to make use of the new features available in Berkeley DB
 650 2.x or greater, use the Perl module B<BerkeleyDB> instead.
 651
 652 B<Note:> The database file format has changed multiple times in Berkeley
 653 DB version 2, 3 and 4. If you cannot recreate your databases, you
 654 must dump any existing databases with either the C<db_dump> or the
 655 C<db_dump185> utility that comes with Berkeley DB.
 656 Once you have rebuilt DB_File to use Berkeley DB version 2 or greater,
 657 your databases can be recreated using C<db_load>. Refer to the Berkeley DB
 658 documentation for further details.
 659
 660 Please read L<"COPYRIGHT"> before using version 2.x or greater of Berkeley
 661 DB with DB_File.
 662
 663 =head2 Interface to Berkeley DB
 664
 665 B<DB_File> allows access to Berkeley DB files using the tie() mechanism
 666 in Perl 5 (for full details, see L<perlfunc/tie()>). This facility
 667 allows B<DB_File> to access Berkeley DB files using either an
 668 associative array (for DB_HASH & DB_BTREE file types) or an ordinary
 669 array (for the DB_RECNO file type).
 670
 671 In addition to the tie() interface, it is also possible to access most
 672 of the functions provided in the Berkeley DB API directly.
 673 See L<THE API INTERFACE>.
 674
 675 =head2 Opening a Berkeley DB Database File
 676
 677 Berkeley DB uses the function dbopen() to open or create a database.
 678 Here is the C prototype for dbopen():
 679
 680       DB*
 681       dbopen (const char * file, int flags, int mode,
 682               DBTYPE type, const void * openinfo)
 683
 684 The parameter C<type> is an enumeration which specifies which of the 3
 685 interface methods (DB_HASH, DB_BTREE or DB_RECNO) is to be used.
 686 Depending on which of these is actually chosen, the final parameter,
 687 I<openinfo> points to a data structure which allows tailoring of the
 688 specific interface method.
 689
 690 This interface is handled slightly differently in B<DB_File>. Here is
 691 an equivalent call using B<DB_File>:
 692
 693         tie %array, 'DB_File', $filename, $flags, $mode, $DB_HASH ;
 694
 695 The C<filename>, C<flags> and C<mode> parameters are the direct
 696 equivalent of their dbopen() counterparts. The final parameter $DB_HASH
 697 performs the function of both the C<type> and C<openinfo> parameters in
 698 dbopen().
 699
 700 In the example above $DB_HASH is actually a pre-defined reference to a
 701 hash object. B<DB_File> has three of these pre-defined references.
 702 Apart from $DB_HASH, there is also $DB_BTREE and $DB_RECNO.
 703
The keys allowed in each of these pre-defined references are limited to
the names used in the equivalent C structure. So, for example, the
$DB_HASH reference will only allow keys called C<bsize>, C<cachesize>,
C<ffactor>, C<hash>, C<lorder> and C<nelem>.
 708
 709 To change one of these elements, just assign to it like this:
 710
 711         $DB_HASH->{'cachesize'} = 10000 ;
 712
 713 The three predefined variables $DB_HASH, $DB_BTREE and $DB_RECNO are
 714 usually adequate for most applications.  If you do need to create extra
 715 instances of these objects, constructors are available for each file
 716 type.
 717
 718 Here are examples of the constructors and the valid options available
 719 for DB_HASH, DB_BTREE and DB_RECNO respectively.
 720
 721      $a = new DB_File::HASHINFO ;
 722      $a->{'bsize'} ;
 723      $a->{'cachesize'} ;
 724      $a->{'ffactor'};
 725      $a->{'hash'} ;
 726      $a->{'lorder'} ;
 727      $a->{'nelem'} ;
 728
 729      $b = new DB_File::BTREEINFO ;
 730      $b->{'flags'} ;
 731      $b->{'cachesize'} ;
 732      $b->{'maxkeypage'} ;
 733      $b->{'minkeypage'} ;
 734      $b->{'psize'} ;
 735      $b->{'compare'} ;
 736      $b->{'prefix'} ;
 737      $b->{'lorder'} ;
 738
 739      $c = new DB_File::RECNOINFO ;
 740      $c->{'bval'} ;
 741      $c->{'cachesize'} ;
 742      $c->{'psize'} ;
 743      $c->{'flags'} ;
 744      $c->{'lorder'} ;
 745      $c->{'reclen'} ;
 746      $c->{'bfname'} ;
 747
The values stored in the hashes above are mostly the direct equivalent
of their C counterpart. Like their C counterparts, all are set to
default values - that means you don't have to set I<all> of the
values when you only want to change one. Here is an example:
 752
 753      $a = new DB_File::HASHINFO ;
 754      $a->{'cachesize'} =  12345 ;
 755      tie %y, 'DB_File', "filename", $flags, 0777, $a ;
 756
 757 A few of the options need extra discussion here. When used, the C
 758 equivalent of the keys C<hash>, C<compare> and C<prefix> store pointers
 759 to C functions. In B<DB_File> these keys are used to store references
 760 to Perl subs. Below are templates for each of the subs:
 761
 762     sub hash
 763     {
 764         my ($data) = @_ ;
 765         ...
 766         # return the hash value for $data
 767         return $hash ;
 768     }
 769
    sub compare
    {
        my ($key1, $key2) = @_ ;
        ...
        # return  0 if $key1 eq $key2
        #        -1 if $key1 lt $key2
        #         1 if $key1 gt $key2
        return (-1 , 0 or 1) ;
    }
 779
    sub prefix
    {
        my ($key1, $key2) = @_ ;
        ...
        # return number of bytes of $key2 which are
        # necessary to determine that it is greater than $key1
        return $bytes ;
    }
 788
 789 See L<Changing the BTREE sort order> for an example of using the
 790 C<compare> template.
 791
 792 If you are using the DB_RECNO interface and you intend making use of
 793 C<bval>, you should check out L<The 'bval' Option>.
 794
 795 =head2 Default Parameters
 796
 797 It is possible to omit some or all of the final 4 parameters in the
 798 call to C<tie> and let them take default values. As DB_HASH is the most
 799 common file format used, the call:
 800
 801     tie %A, "DB_File", "filename" ;
 802
 803 is equivalent to:
 804
 805     tie %A, "DB_File", "filename", O_CREAT|O_RDWR, 0666, $DB_HASH ;
 806
 807 It is also possible to omit the filename parameter as well, so the
 808 call:
 809
 810     tie %A, "DB_File" ;
 811
 812 is equivalent to:
 813
 814     tie %A, "DB_File", undef, O_CREAT|O_RDWR, 0666, $DB_HASH ;
 815
 816 See L<In Memory Databases> for a discussion on the use of C<undef>
 817 in place of a filename.
 818
 819 =head2 In Memory Databases
 820
 821 Berkeley DB allows the creation of in-memory databases by using NULL
 822 (that is, a C<(char *)0> in C) in place of the filename.  B<DB_File>
 823 uses C<undef> instead of NULL to provide this functionality.
 824
 825 =head1 DB_HASH
 826
 827 The DB_HASH file format is probably the most commonly used of the three
 828 file formats that B<DB_File> supports. It is also very straightforward
 829 to use.
 830
 831 =head2 A Simple Example
 832
 833 This example shows how to create a database, add key/value pairs to the
 834 database, delete keys/value pairs and finally how to enumerate the
 835 contents of the database.
 836
 837     use warnings ;
 838     use strict ;
 839     use DB_File ;
 840     our (%h, $k, $v) ;
 841
 842     unlink "fruit" ;
 843     tie %h, "DB_File", "fruit", O_RDWR|O_CREAT, 0666, $DB_HASH
 844         or die "Cannot open file 'fruit': $!\n";
 845
 846     # Add a few key/value pairs to the file
 847     $h{"apple"} = "red" ;
 848     $h{"orange"} = "orange" ;
 849     $h{"banana"} = "yellow" ;
 850     $h{"tomato"} = "red" ;
 851
 852     # Check for existence of a key
 853     print "Banana Exists\n\n" if $h{"banana"} ;
 854
 855     # Delete a key/value pair.
 856     delete $h{"apple"} ;
 857
 858     # print the contents of the file
 859     while (($k, $v) = each %h)
 860       { print "$k -> $v\n" }
 861
 862     untie %h ;
 863
Here is the output:
 865
 866     Banana Exists
 867
 868     orange -> orange
 869     tomato -> red
 870     banana -> yellow
 871
Note that, as with ordinary associative arrays, the keys are retrieved
in an apparently random order.
 874
 875 =head1 DB_BTREE
 876
 877 The DB_BTREE format is useful when you want to store data in a given
 878 order. By default the keys will be stored in lexical order, but as you
 879 will see from the example shown in the next section, it is very easy to
 880 define your own sorting function.
 881
 882 =head2 Changing the BTREE sort order
 883
 884 This script shows how to override the default sorting algorithm that
 885 BTREE uses. Instead of using the normal lexical ordering, a case
 886 insensitive compare function will be used.
 887
 888     use warnings ;
 889     use strict ;
 890     use DB_File ;
 891
 892     my %h ;
 893
 894     sub Compare
 895     {
 896         my ($key1, $key2) = @_ ;
 897         "\L$key1" cmp "\L$key2" ;
 898     }
 899
 900     # specify the Perl sub that will do the comparison
 901     $DB_BTREE->{'compare'} = \&Compare ;
 902
 903     unlink "tree" ;
 904     tie %h, "DB_File", "tree", O_RDWR|O_CREAT, 0666, $DB_BTREE
 905         or die "Cannot open file 'tree': $!\n" ;
 906
 907     # Add a key/value pair to the file
 908     $h{'Wall'} = 'Larry' ;
 909     $h{'Smith'} = 'John' ;
 910     $h{'mouse'} = 'mickey' ;
 911     $h{'duck'}  = 'donald' ;
 912
 913     # Delete
 914     delete $h{"duck"} ;
 915
 916     # Cycle through the keys printing them in order.
 917     # Note it is not necessary to sort the keys as
 918     # the btree will have kept them in order automatically.
 919     foreach (keys %h)
 920       { print "$_\n" }
 921
 922     untie %h ;
 923
 924 Here is the output from the code above.
 925
 926     mouse
 927     Smith
 928     Wall
 929
There are a few points to bear in mind if you want to change the
ordering in a BTREE database:
 932
 933 =over 5
 934
 935 =item 1.
 936
 937 The new compare function must be specified when you create the database.
 938
 939 =item 2.
 940
 941 You cannot change the ordering once the database has been created. Thus
 942 you must use the same compare function every time you access the
 943 database.
 944
=item 3.
 946
Duplicate keys are entirely defined by the comparison function.
In the case-insensitive example above, the keys: 'KEY' and 'key'
would be considered duplicates, and assigning to the second one
would overwrite the first. If duplicates are allowed for (with the
R_DUP flag discussed below), only a single copy of duplicate keys
is stored in the database --- so (again with the example above) assigning
three values to the keys: 'KEY', 'Key', and 'key' would leave just
the first key: 'KEY' in the database with three values. For some
situations this results in information loss, so care should be taken
to provide fully qualified comparison functions when necessary.
For example, the above comparison routine could be modified to
additionally compare case-sensitively if two keys are equal in the
case insensitive comparison:
 960
 961     sub compare {
 962         my($key1, $key2) = @_;
 963         lc $key1 cmp lc $key2 ||
 964         $key1 cmp $key2;
 965     }
 966
 967 And now you will only have duplicates when the keys themselves
 968 are truly the same. (note: in versions of the db library prior to
 969 about November 1996, such duplicate keys were retained so it was
 970 possible to recover the original keys in sets of keys that
 971 compared as equal).
 972
 973
 974 =back
 975
 976 =head2 Handling Duplicate Keys
 977
 978 The BTREE file type optionally allows a single key to be associated
 979 with an arbitrary number of values. This option is enabled by setting
 980 the flags element of C<$DB_BTREE> to R_DUP when creating the database.
 981
 982 There are some difficulties in using the tied hash interface if you
 983 want to manipulate a BTREE database with duplicate keys. Consider this
 984 code:
 985
 986     use warnings ;
 987     use strict ;
 988     use DB_File ;
 989
 990     my ($filename, %h) ;
 991
 992     $filename = "tree" ;
 993     unlink $filename ;
 994
 995     # Enable duplicate records
 996     $DB_BTREE->{'flags'} = R_DUP ;
 997
 998     tie %h, "DB_File", $filename, O_RDWR|O_CREAT, 0666, $DB_BTREE
 999         or die "Cannot open $filename: $!\n";
1000
1001     # Add some key/value pairs to the file
1002     $h{'Wall'} = 'Larry' ;
1003     $h{'Wall'} = 'Brick' ; # Note the duplicate key
1004     $h{'Wall'} = 'Brick' ; # Note the duplicate key and value
1005     $h{'Smith'} = 'John' ;
1006     $h{'mouse'} = 'mickey' ;
1007
1008     # iterate through the associative array
1009     # and print each key/value pair.
1010     foreach (sort keys %h)
1011       { print "$_  -> $h{$_}\n" }
1012
1013     untie %h ;
1014
1015 Here is the output:
1016
1017     Smith   -> John
1018     Wall    -> Larry
1019     Wall    -> Larry
1020     Wall    -> Larry
1021     mouse   -> mickey
1022
1023 As you can see 3 records have been successfully created with key C<Wall>
1024 - the only thing is, when they are retrieved from the database they
1025 I<seem> to have the same value, namely C<Larry>. The problem is caused
1026 by the way that the associative array interface works. Basically, when
1027 the associative array interface is used to fetch the value associated
1028 with a given key, it will only ever retrieve the first value.
1029
1030 Although it may not be immediately obvious from the code above, the
1031 associative array interface can be used to write values with duplicate
1032 keys, but it cannot be used to read them back from the database.
1033
1034 The way to get around this problem is to use the Berkeley DB API method
1035 called C<seq>.  This method allows sequential access to key/value
1036 pairs. See L<THE API INTERFACE> for details of both the C<seq> method
1037 and the API in general.
1038
1039 Here is the script above rewritten using the C<seq> API method.
1040
1041     use warnings ;
1042     use strict ;
1043     use DB_File ;
1044
1045     my ($filename, $x, %h, $status, $key, $value) ;
1046
1047     $filename = "tree" ;
1048     unlink $filename ;
1049
1050     # Enable duplicate records
1051     $DB_BTREE->{'flags'} = R_DUP ;
1052
1053     $x = tie %h, "DB_File", $filename, O_RDWR|O_CREAT, 0666, $DB_BTREE
1054         or die "Cannot open $filename: $!\n";
1055
1056     # Add some key/value pairs to the file
1057     $h{'Wall'} = 'Larry' ;
1058     $h{'Wall'} = 'Brick' ; # Note the duplicate key
1059     $h{'Wall'} = 'Brick' ; # Note the duplicate key and value
1060     $h{'Smith'} = 'John' ;
1061     $h{'mouse'} = 'mickey' ;
1062
1063     # iterate through the btree using seq
1064     # and print each key/value pair.
1065     $key = $value = 0 ;
1066     for ($status = $x->seq($key, $value, R_FIRST) ;
1067          $status == 0 ;
1068          $status = $x->seq($key, $value, R_NEXT) )
1069       {  print "$key -> $value\n" }
1070
1071     undef $x ;
1072     untie %h ;
1073
1074 that prints:
1075
1076     Smith   -> John
1077     Wall    -> Brick
1078     Wall    -> Brick
1079     Wall    -> Larry
1080     mouse   -> mickey
1081
1082 This time we have got all the key/value pairs, including the multiple
1083 values associated with the key C<Wall>.
1084
1085 To make life easier when dealing with duplicate keys, B<DB_File> comes with
1086 a few utility methods.
1087
1088 =head2 The get_dup() Method
1089
1090 The C<get_dup> method assists in
1091 reading duplicate values from BTREE databases. The method can take the
1092 following forms:
1093
1094     $count = $x->get_dup($key) ;
1095     @list  = $x->get_dup($key) ;
1096     %list  = $x->get_dup($key, 1) ;
1097
1098 In a scalar context the method returns the number of values associated
1099 with the key, C<$key>.
1100
1101 In list context, it returns all the values which match C<$key>. Note
1102 that the values will be returned in an apparently random order.
1103
1104 In list context, if the second parameter is present and evaluates
1105 TRUE, the method returns an associative array. The keys of the
1106 associative array correspond to the values that matched in the BTREE
1107 and the values of the array are a count of the number of times that
1108 particular value occurred in the BTREE.
1109
1110 So assuming the database created above, we can use C<get_dup> like
1111 this:
1112
1113     use warnings ;
1114     use strict ;
1115     use DB_File ;
1116
1117     my ($filename, $x, %h) ;
1118
1119     $filename = "tree" ;
1120
1121     # Enable duplicate records
1122     $DB_BTREE->{'flags'} = R_DUP ;
1123
1124     $x = tie %h, "DB_File", $filename, O_RDWR|O_CREAT, 0666, $DB_BTREE
1125         or die "Cannot open $filename: $!\n";
1126
1127     my $cnt  = $x->get_dup("Wall") ;
1128     print "Wall occurred $cnt times\n" ;
1129
1130     my %hash = $x->get_dup("Wall", 1) ;
1131     print "Larry is there\n" if $hash{'Larry'} ;
1132     print "There are $hash{'Brick'} Brick Walls\n" ;
1133
1134     my @list = sort $x->get_dup("Wall") ;
1135     print "Wall =>      [@list]\n" ;
1136
1137     @list = $x->get_dup("Smith") ;
1138     print "Smith =>     [@list]\n" ;
1139
1140     @list = $x->get_dup("Dog") ;
1141     print "Dog =>       [@list]\n" ;
1142
1143
1144 and it will print:
1145
1146     Wall occurred 3 times
1147     Larry is there
1148     There are 2 Brick Walls
1149     Wall =>     [Brick Brick Larry]
1150     Smith =>    [John]
1151     Dog =>      []
1152
1153 =head2 The find_dup() Method
1154
1155     $status = $X->find_dup($key, $value) ;
1156
1157 This method checks for the existence of a specific key/value pair. If the
1158 pair exists, the cursor is left pointing to the pair and the method
1159 returns 0. Otherwise the method returns a non-zero value.
1160
1161 Assuming the database from the previous example:
1162
1163     use warnings ;
1164     use strict ;
1165     use DB_File ;
1166
1167     my ($filename, $x, %h, $found) ;
1168
1169     $filename = "tree" ;
1170
1171     # Enable duplicate records
1172     $DB_BTREE->{'flags'} = R_DUP ;
1173
1174     $x = tie %h, "DB_File", $filename, O_RDWR|O_CREAT, 0666, $DB_BTREE
1175         or die "Cannot open $filename: $!\n";
1176
1177     $found = ( $x->find_dup("Wall", "Larry") == 0 ? "" : "not") ;
1178     print "Larry Wall is $found there\n" ;
1179
1180     $found = ( $x->find_dup("Wall", "Harry") == 0 ? "" : "not") ;
1181     print "Harry Wall is $found there\n" ;
1182
1183     undef $x ;
1184     untie %h ;
1185
1186 prints this
1187
1188     Larry Wall is  there
1189     Harry Wall is not there
1190
1191
1192 =head2 The del_dup() Method
1193
1194     $status = $X->del_dup($key, $value) ;
1195
1196 This method deletes a specific key/value pair. It returns
1197 0 if they exist and have been deleted successfully.
1198 Otherwise the method returns a non-zero value.
1199
1200 Again assuming the existence of the C<tree> database
1201
1202     use warnings ;
1203     use strict ;
1204     use DB_File ;
1205
1206     my ($filename, $x, %h, $found) ;
1207
1208     $filename = "tree" ;
1209
1210     # Enable duplicate records
1211     $DB_BTREE->{'flags'} = R_DUP ;
1212
1213     $x = tie %h, "DB_File", $filename, O_RDWR|O_CREAT, 0666, $DB_BTREE
1214         or die "Cannot open $filename: $!\n";
1215
1216     $x->del_dup("Wall", "Larry") ;
1217
1218     $found = ( $x->find_dup("Wall", "Larry") == 0 ? "" : "not") ;
1219     print "Larry Wall is $found there\n" ;
1220
1221     undef $x ;
1222     untie %h ;
1223
1224 prints this
1225
1226     Larry Wall is not there
1227
1228 =head2 Matching Partial Keys
1229
1230 The BTREE interface has a feature which allows partial keys to be
1231 matched. This functionality is I<only> available when the C<seq> method
1232 is used along with the R_CURSOR flag.
1233
1234     $x->seq($key, $value, R_CURSOR) ;
1235
1236 Here is the relevant quote from the dbopen man page where it defines
1237 the use of the R_CURSOR flag with seq:
1238
1239     Note, for the DB_BTREE access method, the returned key is not
1240     necessarily an exact match for the specified key. The returned key
1241     is the smallest key greater than or equal to the specified key,
1242     permitting partial key matches and range searches.
1243
1244 In the example script below, the C<match> sub uses this feature to find
1245 and print the first matching key/value pair given a partial key.
1246
1247     use warnings ;
1248     use strict ;
1249     use DB_File ;
1250     use Fcntl ;
1251
1252     my ($filename, $x, %h, $st, $key, $value) ;
1253
1254     sub match
1255     {
1256         my $key = shift ;
1257         my $value = 0;
1258         my $orig_key = $key ;
1259         $x->seq($key, $value, R_CURSOR) ;
1260         print "$orig_key\t-> $key\t-> $value\n" ;
1261     }
1262
1263     $filename = "tree" ;
1264     unlink $filename ;
1265
1266     $x = tie %h, "DB_File", $filename, O_RDWR|O_CREAT, 0666, $DB_BTREE
1267         or die "Cannot open $filename: $!\n";
1268
1269     # Add some key/value pairs to the file
1270     $h{'mouse'} = 'mickey' ;
1271     $h{'Wall'} = 'Larry' ;
1272     $h{'Walls'} = 'Brick' ;
1273     $h{'Smith'} = 'John' ;
1274
1275
1276     $key = $value = 0 ;
1277     print "IN ORDER\n" ;
1278     for ($st = $x->seq($key, $value, R_FIRST) ;
1279          $st == 0 ;
1280          $st = $x->seq($key, $value, R_NEXT) )
1281
1282       {  print "$key    -> $value\n" }
1283
1284     print "\nPARTIAL MATCH\n" ;
1285
1286     match "Wa" ;
1287     match "A" ;
1288     match "a" ;
1289
1290     undef $x ;
1291     untie %h ;
1292
1293 Here is the output:
1294
1295     IN ORDER
1296     Smith -> John
1297     Wall  -> Larry
1298     Walls -> Brick
1299     mouse -> mickey
1300
1301     PARTIAL MATCH
1302     Wa -> Wall  -> Larry
1303     A  -> Smith -> John
1304     a  -> mouse -> mickey
1305
1306 =head1 DB_RECNO
1307
1308 DB_RECNO provides an interface to flat text files. Both variable and
1309 fixed length records are supported.
1310
1311 In order to make RECNO more compatible with Perl, the array offset for
1312 all RECNO arrays begins at 0 rather than 1 as in Berkeley DB.
1313
1314 As with normal Perl arrays, a RECNO array can be accessed using
1315 negative indexes. The index -1 refers to the last element of the array,
1316 -2 the second last, and so on. Attempting to access an element before
1317 the start of the array will raise a fatal run-time error.
1318
1319 =head2 The 'bval' Option
1320
1321 The operation of the bval option warrants some discussion. Here is the
1322 definition of bval from the Berkeley DB 1.85 recno manual page:
1323
1324     The delimiting byte to be used to mark  the  end  of  a
1325     record for variable-length records, and the pad charac-
1326     ter for fixed-length records.  If no  value  is  speci-
1327     fied,  newlines  (``\n'')  are  used to mark the end of
1328     variable-length records and  fixed-length  records  are
1329     padded with spaces.
1330
1331 The second sentence is wrong. In actual fact bval will only default to
1332 C<"\n"> when the openinfo parameter in dbopen is NULL. If a non-NULL
1333 openinfo parameter is used at all, the value that happens to be in bval
1334 will be used. That means you always have to specify bval when making
1335 use of any of the options in the openinfo parameter. This documentation
1336 error will be fixed in the next release of Berkeley DB.
1337
1338 That clarifies the situation with regard to Berkeley DB itself. What
1339 about B<DB_File>? Well, the behavior defined in the quote above is
1340 quite useful, so B<DB_File> conforms to it.
1341
1342 That means that you can specify other options (e.g. cachesize) and
1343 still have bval default to C<"\n"> for variable length records, and
1344 space for fixed length records.
1345
1346 Also note that the bval option only allows you to specify a single byte
1347 as a delimiter.
1348
1349 =head2 A Simple Example
1350
1351 Here is a simple example that uses RECNO (if you are using a version
1352 of Perl earlier than 5.004_57 this example won't work -- see
1353 L<Extra RECNO Methods> for a workaround).
1354
1355     use warnings ;
1356     use strict ;
1357     use DB_File ;
1358
1359     my $filename = "text" ;
1360     unlink $filename ;
1361
1362     my @h ;
1363     tie @h, "DB_File", $filename, O_RDWR|O_CREAT, 0666, $DB_RECNO
1364         or die "Cannot open file 'text': $!\n" ;
1365
1366     # Add a few key/value pairs to the file
1367     $h[0] = "orange" ;
1368     $h[1] = "blue" ;
1369     $h[2] = "yellow" ;
1370
1371     push @h, "green", "black" ;
1372
1373     my $elements = scalar @h ;
1374     print "The array contains $elements entries\n" ;
1375
1376     my $last = pop @h ;
1377     print "popped $last\n" ;
1378
1379     unshift @h, "white" ;
1380     my $first = shift @h ;
1381     print "shifted $first\n" ;
1382
1383     # Check for existence of a key
1384     print "Element 1 Exists with value $h[1]\n" if $h[1] ;
1385
1386     # use a negative index
1387     print "The last element is $h[-1]\n" ;
1388     print "The 2nd last element is $h[-2]\n" ;
1389
1390     untie @h ;
1391
1392 Here is the output from the script:
1393
1394     The array contains 5 entries
1395     popped black
1396     shifted white
1397     Element 1 Exists with value blue
1398     The last element is green
1399     The 2nd last element is yellow
1400
1401 =head2 Extra RECNO Methods
1402
1403 If you are using a version of Perl earlier than 5.004_57, the tied
1404 array interface is quite limited. In the example script above
1405 C<push>, C<pop>, C<shift>, C<unshift>
1406 or determining the array length will not work with a tied array.
1407
1408 To make the interface more useful for older versions of Perl, a number
1409 of methods are supplied with B<DB_File> to simulate the missing array
1410 operations. All these methods are accessed via the object returned from
1411 the tie call.
1412
1413 Here are the methods:
1414
1415 =over 5
1416
1417 =item B<$X-E<gt>push(list) ;>
1418
1419 Pushes the elements of C<list> to the end of the array.
1420
1421 =item B<$value = $X-E<gt>pop ;>
1422
1423 Removes and returns the last element of the array.
1424
1425 =item B<$X-E<gt>shift>
1426
1427 Removes and returns the first element of the array.
1428
1429 =item B<$X-E<gt>unshift(list) ;>
1430
1431 Pushes the elements of C<list> to the start of the array.
1432
1433 =item B<$X-E<gt>length>
1434
1435 Returns the number of elements in the array.
1436
1437 =item B<$X-E<gt>splice(offset, length, elements);>
1438
1439 Returns a splice of the array.
1440
1441 =back
1442
1443 =head2 Another Example
1444
1445 Here is a more complete example that makes use of some of the methods
1446 described above. It also makes use of the API interface directly (see
1447 L<THE API INTERFACE>).
1448
1449     use warnings ;
1450     use strict ;
1451     my (@h, $H, $file, $i) ;
1452     use DB_File ;
1453     use Fcntl ;
1454
1455     $file = "text" ;
1456
1457     unlink $file ;
1458
1459     $H = tie @h, "DB_File", $file, O_RDWR|O_CREAT, 0666, $DB_RECNO
1460         or die "Cannot open file $file: $!\n" ;
1461
1462     # first create a text file to play with
1463     $h[0] = "zero" ;
1464     $h[1] = "one" ;
1465     $h[2] = "two" ;
1466     $h[3] = "three" ;
1467     $h[4] = "four" ;
1468
1469
1470     # Print the records in order.
1471     #
1472     # The length method is needed here because evaluating a tied
1473     # array in a scalar context does not return the number of
1474     # elements in the array.
1475
1476     print "\nORIGINAL\n" ;
1477     foreach $i (0 .. $H->length - 1) {
1478         print "$i: $h[$i]\n" ;
1479     }
1480
1481     # use the push & pop methods
1482     $a = $H->pop ;
1483     $H->push("last") ;
1484     print "\nThe last record was [$a]\n" ;
1485
1486     # and the shift & unshift methods
1487     $a = $H->shift ;
1488     $H->unshift("first") ;
1489     print "The first record was [$a]\n" ;
1490
1491     # Use the API to add a new record after record 2.
1492     $i = 2 ;
1493     $H->put($i, "Newbie", R_IAFTER) ;
1494
1495     # and a new record before record 1.
1496     $i = 1 ;
1497     $H->put($i, "New One", R_IBEFORE) ;
1498
1499     # delete record 3
1500     $H->del(3) ;
1501
1502     # now print the records in reverse order
1503     print "\nREVERSE\n" ;
1504     for ($i = $H->length - 1 ; $i >= 0 ; -- $i)
1505       { print "$i: $h[$i]\n" }
1506
1507     # same again, but use the API functions instead
1508     print "\nREVERSE again\n" ;
1509     my ($s, $k, $v)  = (0, 0, 0) ;
1510     for ($s = $H->seq($k, $v, R_LAST) ;
1511              $s == 0 ;
1512              $s = $H->seq($k, $v, R_PREV))
1513       { print "$k: $v\n" }
1514
1515     undef $H ;
1516     untie @h ;
1517
1518 and this is what it outputs:
1519
1520     ORIGINAL
1521     0: zero
1522     1: one
1523     2: two
1524     3: three
1525     4: four
1526
1527     The last record was [four]
1528     The first record was [zero]
1529
1530     REVERSE
1531     5: last
1532     4: three
1533     3: Newbie
1534     2: one
1535     1: New One
1536     0: first
1537
1538     REVERSE again
1539     5: last
1540     4: three
1541     3: Newbie
1542     2: one
1543     1: New One
1544     0: first
1545
1546 Notes:
1547
1548 =over 5
1549
1550 =item 1.
1551
1552 Rather than iterating through the array, C<@h> like this:
1553
1554     foreach $i (@h)
1555
1556 it is necessary to use either this:
1557
1558     foreach $i (0 .. $H->length - 1)
1559
1560 or this:
1561
1562     for ($a = $H->seq($k, $v, R_FIRST) ;
1563          $a == 0 ;
1564          $a = $H->seq($k, $v, R_NEXT) )
1565
1566 =item 2.
1567
1568 Notice that both times the C<put> method was used the record index was
1569 specified using a variable, C<$i>, rather than the literal value
1570 itself. This is because C<put> will return the record number of the
1571 inserted line via that parameter.
1572
1573 =back
1574
1575 =head1 THE API INTERFACE
1576
1577 As well as accessing Berkeley DB using a tied hash or array, it is also
1578 possible to make direct use of most of the API functions defined in the
1579 Berkeley DB documentation.
1580
1581 To do this you need to store a copy of the object returned from the tie.
1582
1583         $db = tie %hash, "DB_File", "filename" ;
1584
1585 Once you have done that, you can access the Berkeley DB API functions
1586 as B<DB_File> methods directly like this:
1587
1588         $db->put($key, $value, R_NOOVERWRITE) ;
1589
1590 B<Important:> If you have saved a copy of the object returned from
1591 C<tie>, the underlying database file will I<not> be closed until both
1592 the tied variable is untied and all copies of the saved object are
1593 destroyed.
1594
1595     use DB_File ;
1596     $db = tie %hash, "DB_File", "filename"
1597         or die "Cannot tie filename: $!" ;
1598     ...
1599     undef $db ;
1600     untie %hash ;
1601
1602 See L<The untie() Gotcha> for more details.
1603
1604 All the functions defined in L<dbopen> are available except for
1605 close() and dbopen() itself. The B<DB_File> method interface to the
1606 supported functions has been implemented to mirror the way Berkeley DB
1607 works whenever possible. In particular note that:
1608
1609 =over 5
1610
1611 =item *
1612
1613 The methods return a status value. All return 0 on success.
1614 All return -1 to signify an error and set C<$!> to the exact
1615 error code. The return code 1 generally (but not always) means that the
1616 key specified did not exist in the database.
1617
1618 Other return codes are defined. See below and in the Berkeley DB
1619 documentation for details. The Berkeley DB documentation should be used
1620 as the definitive source.
1621
1622 =item *
1623
1624 Whenever a Berkeley DB function returns data via one of its parameters,
1625 the equivalent B<DB_File> method does exactly the same.
1626
1627 =item *
1628
1629 If you are careful, it is possible to mix API calls with the tied
1630 hash/array interface in the same piece of code. Although only a few of
1631 the methods used to implement the tied interface currently make use of
1632 the cursor, you should always assume that the cursor has been changed
1633 any time the tied hash/array interface is used. As an example, this
1634 code will probably not do what you expect:
1635
1636     $X = tie %x, 'DB_File', $filename, O_RDWR|O_CREAT, 0777, $DB_BTREE
1637         or die "Cannot tie $filename: $!" ;
1638
1639     # Get the first key/value pair and set  the cursor
1640     $X->seq($key, $value, R_FIRST) ;
1641
1642     # this line will modify the cursor
1643     $count = scalar keys %x ;
1644
1645     # Get the second key/value pair.
1646     # oops, it didn't, it got the last key/value pair!
1647     $X->seq($key, $value, R_NEXT) ;
1648
1649 The code above can be rearranged to get around the problem, like this:
1650
1651     $X = tie %x, 'DB_File', $filename, O_RDWR|O_CREAT, 0777, $DB_BTREE
1652         or die "Cannot tie $filename: $!" ;
1653
1654     # this line will modify the cursor
1655     $count = scalar keys %x ;
1656
1657     # Get the first key/value pair and set  the cursor
1658     $X->seq($key, $value, R_FIRST) ;
1659
1660     # Get the second key/value pair.
1661     # worked this time.
1662     $X->seq($key, $value, R_NEXT) ;
1663
1664 =back
1665
1666 All the constants defined in L<dbopen> for use in the flags parameters
1667 in the methods defined below are also available. Refer to the Berkeley
1668 DB documentation for the precise meaning of the flags values.
1669
1670 Below is a list of the methods available.
1671
1672 =over 5
1673
1674 =item B<$status = $X-E<gt>get($key, $value [, $flags]) ;>
1675
1676 Given a key (C<$key>) this method reads the value associated with it
1677 from the database. The value read from the database is returned in the
1678 C<$value> parameter.
1679
1680 If the key does not exist the method returns 1.
1681
1682 No flags are currently defined for this method.
1683
1684 =item B<$status = $X-E<gt>put($key, $value [, $flags]) ;>
1685
1686 Stores the key/value pair in the database.
1687
1688 If you use either the R_IAFTER or R_IBEFORE flags, the C<$key> parameter
1689 will have the record number of the inserted key/value pair set.
1690
1691 Valid flags are R_CURSOR, R_IAFTER, R_IBEFORE, R_NOOVERWRITE and
1692 R_SETCURSOR.
1693
1694 =item B<$status = $X-E<gt>del($key [, $flags]) ;>
1695
1696 Removes all key/value pairs with key C<$key> from the database.
1697
1698 A return code of 1 means that the requested key was not in the
1699 database.
1700
1701 R_CURSOR is the only valid flag at present.
1702
1703 =item B<$status = $X-E<gt>fd ;>
1704
1705 Returns the file descriptor for the underlying database.
1706
1707 See L<Locking: The Trouble with fd> for an explanation of why you should
1708 not use C<fd> to lock your database.
1709
1710 =item B<$status = $X-E<gt>seq($key, $value, $flags) ;>
1711
1712 This interface allows sequential retrieval from the database. See
1713 L<dbopen> for full details.
1714
1715 Both the C<$key> and C<$value> parameters will be set to the key/value
1716 pair read from the database.
1717
1718 The flags parameter is mandatory. The valid flag values are R_CURSOR,
1719 R_FIRST, R_LAST, R_NEXT and R_PREV.
1720
1721 =item B<$status = $X-E<gt>sync([$flags]) ;>
1722
1723 Flushes any cached buffers to disk.
1724
1725 R_RECNOSYNC is the only valid flag at present.
1726
1727 =back
1728
1729 =head1 DBM FILTERS
1730
1731 A DBM Filter is a piece of code that is used when you I<always>
1732 want to make the same transformation to all keys and/or values in a
1733 DBM database.
1734
1735 There are four methods associated with DBM Filters. All work identically,
1736 and each is used to install (or uninstall) a single DBM Filter. Each
1737 expects a single parameter, namely a reference to a sub. The only
1738 difference between them is the place that the filter is installed.
1739
1740 To summarise:
1741
1742 =over 5
1743
1744 =item B<filter_store_key>
1745
1746 If a filter has been installed with this method, it will be invoked
1747 every time you write a key to a DBM database.
1748
1749 =item B<filter_store_value>
1750
1751 If a filter has been installed with this method, it will be invoked
1752 every time you write a value to a DBM database.
1753
1754
1755 =item B<filter_fetch_key>
1756
1757 If a filter has been installed with this method, it will be invoked
1758 every time you read a key from a DBM database.
1759
1760 =item B<filter_fetch_value>
1761
1762 If a filter has been installed with this method, it will be invoked
1763 every time you read a value from a DBM database.
1764
1765 =back
1766
1767 You can use any combination of the methods, from none, to all four.
1768
1769 All filter methods return the existing filter, if present, or C<undef>
1770 if not.
1771
1772 To delete a filter pass C<undef> to it.
1773
1774 =head2 The Filter
1775
1776 When each filter is called by Perl, a local copy of C<$_> will contain
1777 the key or value to be filtered. Filtering is achieved by modifying
1778 the contents of C<$_>. The return code from the filter is ignored.
1779
1780 =head2 An Example -- the NULL termination problem.
1781
1782 Consider the following scenario. You have a DBM database
1783 that you need to share with a third-party C application. The C application
1784 assumes that I<all> keys and values are NULL terminated. Unfortunately
1785 when Perl writes to DBM databases it doesn't use NULL termination, so
1786 your Perl application will have to manage NULL termination itself. When
1787 you write to the database you will have to use something like this:
1788
1789     $hash{"$key\0"} = "$value\0" ;
1790
1791 Similarly the NULL needs to be taken into account when you are considering
1792 the length of existing keys/values.
1793
1794 It would be much better if you could ignore the NULL terminations issue
1795 in the main application code and have a mechanism that automatically
1796 added the terminating NULL to all keys and values whenever you write to
1797 the database and have them removed when you read from the database. As I'm
1798 sure you have already guessed, this is a problem that DBM Filters can
1799 fix very easily.
1800
1801     use warnings ;
1802     use strict ;
1803     use DB_File ;
1804
1805     my %hash ;
1806     my $filename = "/tmp/filt" ;
1807     unlink $filename ;
1808
1809     my $db = tie %hash, 'DB_File', $filename, O_CREAT|O_RDWR, 0666, $DB_HASH
1810       or die "Cannot open $filename: $!\n" ;
1811
1812     # Install DBM Filters
1813     $db->filter_fetch_key  ( sub { s/\0$//    } ) ;
1814     $db->filter_store_key  ( sub { $_ .= "\0" } ) ;
1815     $db->filter_fetch_value( sub { s/\0$//    } ) ;
1816     $db->filter_store_value( sub { $_ .= "\0" } ) ;
1817
1818     $hash{"abc"} = "def" ;
1819     my $a = $hash{"ABC"} ;
1820     # ...
1821     undef $db ;
1822     untie %hash ;
1823
1824 Hopefully the contents of each of the filters should be
1825 self-explanatory. Both "fetch" filters remove the terminating NULL,
1826 and both "store" filters add a terminating NULL.
1827
1828
1829 =head2 Another Example -- Key is a C int.
1830
1831 Here is another real-life example. By default, whenever Perl writes to
1832 a DBM database it always writes the key and value as strings. So when
1833 you use this:
1834
1835     $hash{12345} = "something" ;
1836
1837 the key 12345 will get stored in the DBM database as the 5 byte string
1838 "12345". If you actually want the key to be stored in the DBM database
1839 as a C int, you will have to use C<pack> when writing, and C<unpack>
1840 when reading.
1841
1842 Here is a DBM Filter that does it:
1843
1844     use warnings ;
1845     use strict ;
1846     use DB_File ;
1847     my %hash ;
1848     my $filename = "/tmp/filt" ;
1849     unlink $filename ;
1850
1851
1852     my $db = tie %hash, 'DB_File', $filename, O_CREAT|O_RDWR, 0666, $DB_HASH
1853       or die "Cannot open $filename: $!\n" ;
1854
1855     $db->filter_fetch_key  ( sub { $_ = unpack("i", $_) } ) ;
1856     $db->filter_store_key  ( sub { $_ = pack ("i", $_) } ) ;
1857     $hash{123} = "def" ;
1858     # ...
1859     undef $db ;
1860     untie %hash ;
1861
1862 This time only two filters have been used -- we only need to manipulate
1863 the contents of the key, so it wasn't necessary to install any value
1864 filters.
1865
1866 =head1 HINTS AND TIPS
1867
1868
1869 =head2 Locking: The Trouble with fd
1870
1871 Until version 1.72 of this module, the recommended technique for locking
1872 B<DB_File> databases was to flock the filehandle returned from the "fd"
1873 function. Unfortunately this technique has been shown to be fundamentally
1874 flawed (Kudos to David Harris for tracking this down). Use it at your own
1875 peril!
1876
1877 The locking technique went like this.
1878
1879     $db = tie(%db, 'DB_File', '/tmp/foo.db', O_CREAT|O_RDWR, 0666)
1880         || die "dbcreat /tmp/foo.db $!";
1881     $fd = $db->fd;
1882     open(DB_FH, "+<&=$fd") || die "dup $!";
1883     flock (DB_FH, LOCK_EX) || die "flock: $!";
1884     ...
1885     $db{"Tom"} = "Jerry" ;
1886     ...
1887     flock(DB_FH, LOCK_UN);
1888     undef $db;
1889     untie %db;
1890     close(DB_FH);
1891
1892 In simple terms, this is what happens:
1893
1894 =over 5
1895
1896 =item 1.
1897
1898 Use "tie" to open the database.
1899
1900 =item 2.
1901
1902 Lock the database with fd & flock.
1903
1904 =item 3.
1905
1906 Read & Write to the database.
1907
1908 =item 4.
1909
1910 Unlock and close the database.
1911
1912 =back
1913
1914 Here is the crux of the problem. A side-effect of opening the B<DB_File>
1915 database in step 1 is that an initial block from the database will get
1916 read from disk and cached in memory.
1917
1918 To see why this is a problem, consider what can happen when two processes,
1919 say "A" and "B", both want to update the same B<DB_File> database
1920 using the locking steps outlined above. Assume process "A" has already
1921 opened the database and has a write lock, but it hasn't actually updated
1922 the database yet (it has finished step 2, but not started step 3 yet). Now
1923 process "B" tries to open the same database - step 1 will succeed,
1924 but it will block on step 2 until process "A" releases the lock. The
1925 important thing to notice here is that at this point in time both
1926 processes will have cached identical initial blocks from the database.
1927
1928 Now process "A" updates the database and happens to change some of the
1929 data held in the initial buffer. Process "A" terminates, flushing
1930 all cached data to disk and releasing the database lock. At this point
1931 the database on disk will correctly reflect the changes made by process
1932 "A".
1933
1934 With the lock released, process "B" can now continue. It also updates the
1935 database and unfortunately it too modifies the data that was in its
1936 initial buffer. Once that data gets flushed to disk it will overwrite
1937 some/all of the changes process "A" made to the database.
1938
1939 The result of this scenario is at best a database that doesn't contain
1940 what you expect. At worst the database will corrupt.
1941
1942 The above won't happen every time competing processes update the same
1943 B<DB_File> database, but it does illustrate why the technique should
1944 not be used.
1945
1946 =head2 Safe ways to lock a database
1947
1948 Starting with version 2.x, Berkeley DB  has internal support for locking.
1949 The companion module to this one, B<BerkeleyDB>, provides an interface
1950 to this locking functionality. If you are serious about locking
1951 Berkeley DB databases, I strongly recommend using B<BerkeleyDB>.
1952
1953 If using B<BerkeleyDB> isn't an option, there are a number of modules
1954 available on CPAN that can be used to implement locking. Each one
1955 implements locking differently and has different goals in mind. It is
1956 therefore worth knowing the difference, so that you can pick the right
1957 one for your application. Here are the three locking wrappers:
1958
1959 =over 5
1960
1961 =item B<Tie::DB_Lock>
1962
1963 A B<DB_File> wrapper which creates copies of the database file for
1964 read access, so that you have a kind of a multiversioning concurrent read
1965 system. However, updates are still serial. Use for databases where reads
1966 may be lengthy and consistency problems may occur.
1967
1968 =item B<Tie::DB_LockFile>
1969
1970 A B<DB_File> wrapper that has the ability to lock and unlock the database
1971 while it is being used. Avoids the tie-before-flock problem by simply
1972 re-tie-ing the database when you get or drop a lock.  Because of the
1973 flexibility in dropping and re-acquiring the lock in the middle of a
1974 session, this can be massaged into a system that will work with long
1975 updates and/or reads if the application follows the hints in the POD
1976 documentation.
1977
1978 =item B<DB_File::Lock>
1979
1980 An extremely lightweight B<DB_File> wrapper that simply flocks a lockfile
1981 before tie-ing the database and drops the lock after the untie. Allows
1982 one to use the same lockfile for multiple databases to avoid deadlock
1983 problems, if desired. Use for databases where updates and reads are
1984 quick and simple flock locking semantics are enough.
1985
1986 =back
1987
1988 =head2 Sharing Databases With C Applications
1989
1990 There is no technical reason why a Berkeley DB database cannot be
1991 shared by both a Perl and a C application.
1992
1993 The vast majority of problems that are reported in this area boil down
1994 to the fact that C strings are NULL terminated, whilst Perl strings are
1995 not. See L<DBM FILTERS> for a generic way to work around this problem.
1996
1997 Here is a real example. Netscape 2.0 keeps a record of the locations you
1998 visit along with the time you last visited them in a DB_HASH database.
1999 This is usually stored in the file F<~/.netscape/history.db>. The key
2000 field in the database is the location string and the value field is the
2001 time the location was last visited stored as a 4 byte binary value.
2002
2003 If you haven't already guessed, the location string is stored with a
2004 terminating NULL. This means you need to be careful when accessing the
2005 database.
2006
2007 Here is a snippet of code that is loosely based on Tom Christiansen's
2008 I<ggh> script (available from your nearest CPAN archive in
2009 F<authors/id/TOMC/scripts/nshist.gz>).
2010
2011     use warnings ;
2012     use strict ;
2013     use DB_File ;
2014     use Fcntl ;
2015
2016     my ($dotdir, $HISTORY, %hist_db, $href, $binary_time, $date) ;
2017     $dotdir = $ENV{HOME} || $ENV{LOGNAME};
2018
2019     $HISTORY = "$dotdir/.netscape/history.db";
2020
2021     tie %hist_db, 'DB_File', $HISTORY
2022         or die "Cannot open $HISTORY: $!\n" ;
2023
2024     # Dump the complete database
2025     while ( ($href, $binary_time) = each %hist_db ) {
2026
2027         # remove the terminating NULL
2028         $href =~ s/\x00$// ;
2029
2030         # convert the binary time into a user friendly string
2031         $date = localtime unpack("V", $binary_time);
2032         print "$date $href\n" ;
2033     }
2034
2035     # check for the existence of a specific key
2036     # remember to add the NULL
2037     if ( $binary_time = $hist_db{"http://mox.perl.com/\x00"} ) {
2038         $date = localtime unpack("V", $binary_time) ;
2039         print "Last visited mox.perl.com on $date\n" ;
2040     }
2041     else {
2042         print "Never visited mox.perl.com\n"
2043     }
2044
2045     untie %hist_db ;
2046
2047 =head2 The untie() Gotcha
2048
2049 If you make use of the Berkeley DB API, it is I<very> strongly
2050 recommended that you read L<perltie/The untie Gotcha>.
2051
2052 Even if you don't currently make use of the API interface, it is still
2053 worth reading it.
2054
2055 Here is an example which illustrates the problem from a B<DB_File>
2056 perspective:
2057
2058     use DB_File ;
2059     use Fcntl ;
2060
2061     my %x ;
2062     my $X ;
2063
2064     $X = tie %x, 'DB_File', 'tst.fil' , O_RDWR|O_TRUNC
2065         or die "Cannot tie first time: $!" ;
2066
2067     $x{123} = 456 ;
2068
2069     untie %x ;
2070
2071     tie %x, 'DB_File', 'tst.fil' , O_RDWR|O_CREAT
2072         or die "Cannot tie second time: $!" ;
2073
2074     untie %x ;
2075
2076 When run, the script will produce this error message:
2077
2078     Cannot tie second time: Invalid argument at bad.file line 14.
2079
2080 Although the error message above refers to the second tie() statement
2081 in the script, the source of the problem is really with the untie()
2082 statement that precedes it.
2083
2084 Having read L<perltie> you will probably have already guessed that the
2085 error is caused by the extra copy of the tied object stored in C<$X>.
2086 If you haven't, then the problem boils down to the fact that the
2087 B<DB_File> destructor, DESTROY, will not be called until I<all>
2088 references to the tied object are destroyed. Both the tied variable,
2089 C<%x>, and C<$X> above hold a reference to the object. The call to
2090 untie() will destroy the first, but C<$X> still holds a valid
2091 reference, so the destructor will not get called and the database file
2092 F<tst.fil> will remain open. The fact that Berkeley DB then reports the
2093 attempt to open a database that is already open via the catch-all
2094 "Invalid argument" doesn't help.
2095
2096 If you run the script with the C<-w> flag the error message becomes:
2097
2098     untie attempted while 1 inner references still exist at bad.file line 12.
2099     Cannot tie second time: Invalid argument at bad.file line 14.
2100
2101 which pinpoints the real problem. Finally the script can now be
2102 modified to fix the original problem by destroying the API object
2103 before the untie:
2104
2105     ...
2106     $x{123} = 456 ;
2107
2108     undef $X ;
2109     untie %x ;
2110
2111     $X = tie %x, 'DB_File', 'tst.fil' , O_RDWR|O_CREAT
2112     ...
2113
2114
2115 =head1 COMMON QUESTIONS
2116
2117 =head2 Why is there Perl source in my database?
2118
2119 If you look at the contents of a database file created by DB_File,
2120 there can sometimes be part of a Perl script included in it.
2121
2122 This happens because Berkeley DB uses dynamic memory to allocate
2123 buffers which will subsequently be written to the database file. Being
2124 dynamic, the memory could have been used for anything before DB
2125 malloced it. As Berkeley DB doesn't clear the memory once it has been
2126 allocated, the unused portions will contain random junk. In the case
2127 where a Perl script gets written to the database, the random junk will
2128 correspond to an area of dynamic memory that happened to be used during
2129 the compilation of the script.
2130
2131 Unless you don't like the possibility of there being part of your Perl
2132 scripts embedded in a database file, this is nothing to worry about.
2133
2134 =head2 How do I store complex data structures with DB_File?
2135
2136 Although B<DB_File> cannot do this directly, there is a module which
2137 can layer transparently over B<DB_File> to accomplish this feat.
2138
2139 Check out the MLDBM module, available on CPAN in the directory
2140 F<modules/by-module/MLDBM>.
2141
2142 =head2 What does "Invalid Argument" mean?
2143
2144 You will get this error message when one of the parameters in the
2145 C<tie> call is wrong. Unfortunately there are quite a few parameters to
2146 get wrong, so it can be difficult to figure out which one it is.
2147
2148 Here are a couple of possibilities:
2149
2150 =over 5
2151
2152 =item 1.
2153
2154 Attempting to reopen a database without closing it.
2155
2156 =item 2.
2157
2158 Using the O_WRONLY flag.
2159
2160 =back
2161
2162 =head2 What does "Bareword 'DB_File' not allowed" mean?
2163
2164 You will encounter this particular error message when you have the
2165 C<strict 'subs'> pragma (or the full strict pragma) in your script.
2166 Consider this script:
2167
2168     use warnings ;
2169     use strict ;
2170     use DB_File ;
2171     my %x ;
2172     tie %x, DB_File, "filename" ;
2173
2174 Running it produces the error in question:
2175
2176     Bareword "DB_File" not allowed while "strict subs" in use
2177
2178 To get around the error, place the word C<DB_File> in either single or
2179 double quotes, like this:
2180
2181     tie %x, "DB_File", "filename" ;
2182
2183 Although it might seem like a real pain, it is really worth the effort
2184 of having a C<use strict> in all your scripts.
2185
2186 =head1 REFERENCES
2187
2188 Articles that are either about B<DB_File> or make use of it.
2189
2190 =over 5
2191
2192 =item 1.
2193
2194 I<Full-Text Searching in Perl>, Tim Kientzle (tkientzle@ddj.com),
2195 Dr. Dobb's Journal, Issue 295, January 1999, pp 34-41
2196
2197 =back
2198
2199 =head1 HISTORY
2200
2201 Moved to the Changes file.
2202
2203 =head1 BUGS
2204
2205 Some older versions of Berkeley DB had problems with fixed length
2206 records using the RECNO file format. This problem has been fixed since
2207 version 1.85 of Berkeley DB.
2208
2209 I am sure there are bugs in the code. If you do find any, or can
2210 suggest any enhancements, I would welcome your comments.
2211
2212 =head1 AVAILABILITY
2213
2214 B<DB_File> comes with the standard Perl source distribution. Look in
2215 the directory F<ext/DB_File>. Given the amount of time between releases
2216 of Perl, the version that ships with Perl is quite likely to be out of
2217 date; the most recent version can always be found on CPAN (see
2218 L<perlmod/CPAN> for details), in the directory
2219 F<modules/by-module/DB_File>.
2220
2221 This version of B<DB_File> will work with either version 1.x, 2.x or
2222 3.x of Berkeley DB, but is limited to the functionality provided by
2223 version 1.
2224
2225 The official web site for Berkeley DB is F<http://www.sleepycat.com>.
2226 All versions of Berkeley DB are available there.
2227
2228 Alternatively, Berkeley DB version 1 is available at your nearest CPAN
2229 archive in F<src/misc/db.1.85.tar.gz>.
2230
2231 If you are running IRIX, then get Berkeley DB version 1 from
2232 F<http://reality.sgi.com/ariel>. It has the patches necessary to
2233 compile properly on IRIX 5.3.
2234
2235 =head1 COPYRIGHT
2236
2237 Copyright (c) 1995-2002 Paul Marquess. All rights reserved. This program
2238 is free software; you can redistribute it and/or modify it under the
2239 same terms as Perl itself.
2240
2241 Although B<DB_File> is covered by the Perl license, the library it
2242 makes use of, namely Berkeley DB, is not. Berkeley DB has its own
2243 copyright and its own license. Please take the time to read it.
2244
2245 Here are a few words taken from the Berkeley DB FAQ (at
2246 F<http://www.sleepycat.com>) regarding the license:
2247
2248     Do I have to license DB to use it in Perl scripts?
2249
2250     No. The Berkeley DB license requires that software that uses
2251     Berkeley DB be freely redistributable. In the case of Perl, that
2252     software is Perl, and not your scripts. Any Perl scripts that you
2253     write are your property, including scripts that make use of
2254     Berkeley DB. Neither the Perl license nor the Berkeley DB license
2255     place any restriction on what you may do with them.
2256
2257 If you are in any doubt about the license situation, contact either the
2258 Berkeley DB authors or the author of DB_File. See L<"AUTHOR"> for details.
2259
2260
2261 =head1 SEE ALSO
2262
2263 L<perl(1)>, L<dbopen(3)>, L<hash(3)>, L<recno(3)>, L<btree(3)>,
2264 L<perldbmfilter>
2265
2266 =head1 AUTHOR
2267
2268 The DB_File interface was written by Paul Marquess
2269 E<lt>Paul.Marquess@btinternet.comE<gt>.
2270 Questions about the DB system itself may be addressed to
2271 E<lt>db@sleepycat.comE<gt>.
2272
2273 =cut