File Coverage

blib/lib/Boulder/Store.pm

Criterion	Covered	Total	%
statement	10	12	83.3
branch			n/a
condition			n/a
subroutine	4	4	100.0
pod			n/a
total	14	16	87.5

line	stmt	sub	time	code
1				# $Id: Store.pm,v 1.6 2002/06/28 20:31:59 lstein Exp $
2
3				# Prototype support library for storing Boulder streams.
4				# Basic design is as follows:
5				# The "data" file, named .records contains
6				# a recno style data file. Records are delimited by
7				# newlines. Each record has this form:
8
9				# tag=long string value&tag=long string value...
10				# Subrecords are delimited by {} pairs as per the
11				# usual boulderio format.
12
13				# The "index" file, named .index, is a DB_Hash
14				# that contains several things:
15				# 1. Indexes. The key is used to translate
16				# from index to the list of record entries.
17				# 2. Other information:
18				# .INDICES -- list of tags that are indexed.
19
20				package Boulder::Store;
21
22				=head1 NAME
23
24				Boulder::Store - Simple persistent storage for Stone tag/value objects
25
26				=head1 SYNOPSIS
27
28				Boulder:Store;
29
30				my $store=new Boulder::Store('test.db',1);
31				my $s = new Stone (Name=>'george',
32				Age=>23,
33				Sex=>M,
34				Address=>{
35				Street=>'29 Rockland drive',
36				Town=>'Fort Washington',
37				ZIP=>'77777'
38				}
39				);
40				$store->put($s);
41				$store->put(new Stone(Name=>'fred',
42				Age=>30,
43				Sex=>M,
44				Address=>{
45				Street=>'19 Gravel Path',
46				Town=>'Bedrock',
47				ZIP=>'12345'},
48				Phone=>{
49				Day=>'111-1111',
50				Eve=>'222-2222'
51				}
52				));
53				$store->put(new Stone(Name=>'andrew',
54				Age=>18,
55				Sex=>M));
56
57				$store->add_index('Name');
58
59				my $stone = $store->get(0);
60				print "name = ",$stone->Name;
61
62				=head1 DESCRIPTION
63
64				Boulder::Store provides persistent storage for Boulder objects using a
65				simple DB_File implementation. To use it, you need to have Berkeley
66				db installed (also known as libdb), and the Perl DB_File module. See
67				the DB_File package for more details on obtaining Berkeley db if you
68				do not already have it.
69
70				Boulder::Store provides an unsophisticated query mechanism which takes
71				advantage of indexes that you specify. Despite its lack of
72				sophistication, the query system is often very helpful.
73
74				=head1 CLASS METHODS
75
76				=over 4
77
78				=item $store = Boulder::Store->new("database/path",$writable)
79
80				The B method creates a new Boulder::Store object and associates
81				it with the database file provided in the first parameter (undef is a
82				valid pathname, in which case all methods work but the data isn't
83				stored). The second parameter should be a B value if you want
84				to open the database for writing. Otherwise it's opened read only.
85
86				Because the underlying storage implementation is not multi-user, only
87				one process can have the database for writing at a time. A
88				B-based locking mechanism is used to give a process that has
89				the database opened for writing exclusive access to the database.
90				This also prevents the database from being opened for reading while
91				another process is writing to it (this is a B thing). Multiple
92				simultaneous processes can open the database read only.
93
94				Physically the data is stored in a human-readable file with the
95				extension ".data".
96
97				=back
98
99				=head1 OBJECT METHODS
100
101				=over 4
102
103				=item $stone = $store->read_record(@taglist)
104
105				The semantics of this call are exactly the same as in
106				B. Stones are returned in sequential order, starting
107				with the first record. In addition to their built-in tags, each stone
108				returned from this call has an additional tag called "record_no".
109				This is the zero-based record number of the stone in the database.
110				Use the B method to begin iterating from the beginning of the
111				database.
112
113				If called in an array context, B returns a list of all
114				stones in the database that contains one or more of the provided tags.
115
116				=item $stone = $store->write_record($stone [,$index])
117
118				This has the same semantics as B. A stone is
119				appended to the end of the database. If successful, this call returns
120				the record number of the new entry. By providing an optional second
121				parameter, you can control where the stone is entered. A positive
122				numeric index will write the stone into the database at that position.
123				A value of -1 will use the Stone's internal record number (if present)
124				to determine where to place it.
125
126				=item $stone = $store->get($record_no)
127
128				This is random access to the database. Provide a record number and
129				this call will return the stone stored at that position.
130
131				=item $record_number = $store->put($stone,$record_no)
132
133				This is a random write to the database. Provide a record number and
134				this call stores the stone at the indicated position, replacing whatever
135				was there before.
136
137				If no record number is provided, this call will look for the presence
138				of a 'record_no' tag in the stone itself and put it back in that
139				position. This allows you to pull a stone out of the database, modify
140				it, and then put it back in without worrying about its record number.
141				If no record is found in the stone, then the effect is identical to
142				write_record().
143
144				The record number of the inserted stone is returned from this call, or
145				-1 if an error occurred.
146
147				=item $store->delete($stone),Boulder::Store::delete($record_no)
148
149				These method calls delete a stone from the database. You can provide
150				either the record number or a stone containing the 'record_no' tag.
151				B: if the database is heavily indexed deletes can be
152				time-consuming as it requires the index to be brought back into synch.
153
154				=item $record_count = $store->length()
155
156				This returns the length of the database, in records.
157
158				=item $store->reset()
159
160				This resets the database, nullifying any queries in effect, and
161				causing read_record() to begin fetching stones from the first record.
162
163				=item $store->query(%query_array)
164
165				This creates a query on the database used for selecting stones in
166				B. The query is an associative array. Three types of
167				keys/value pairs are allowed:
168
169				=over 4
170
171				=item (1) $index=>$value
172
173				This instructs Boulder::Store to look for stones containing the
174				specified tags in which the tag's value (determined by the Stone
175				B method) exactly matches the provided
176				value. Example:
177
178				$db->query('STS.left_primer.length'=>30);
179
180				Only the non-bracketed forms of the index string are allowed (this
181				is probably a bug...)
182
183				If the tag path was declared to be an index, then this search
184				will be fast. Otherwise Boulder::Store must iterate over every
185				record in the database.
186
187				=item (2) EVAL=>'expression'
188
189				This instructs Boulder::Store to look for stones in which the
190				provided expression evaluates to B. When the expression
191				is evaluated, the variable B<$s> will be set to the current
192				record's stone. As a shortcut, you can use ""
193				as shorthand for "$s->index('index.string')".
194
195				=item (3) EVAL=>['expression1','expression2','expression3'...]
196
197				This lets you provide a whole bunch of expressions, and is exactly
198				equivalent to EVAL=>'(expression1) && (expression2) && (expression3)'.
199
200				=back
201
202				You can mix query types in the parameter provided to B.
203				For example, here's how to look up all stones in which the sex is
204				male and the age is greater than 30:
205
206				$db->query('sex'=>'M',EVAL=>' > 30');
207
208				When a query is in effect, B returns only Stones
209				that satisfy the query. In an array context, B
210				returns a list of all Stones that satisfy the query. When no
211				more satisfactory Stones are found, B returns
212				B until a new query is entered or B is called.
213
214				=item $store->add_index(@indices)
215
216				Declare one or more tag paths to be a part of a fast index.
217				B will take advantage of this record when processing
218				queries. For example:
219
220				$db->add_index('age','sex','person.pets');
221
222				You can add indexes any time you like, when the database is first
223				created or later. There is a trade off: B,
224				B, and other data-modifying calls will become slower as
225				more indexes are added.
226
227				The index is stored in an external file with the extension ".index".
228				An index file is created even if you haven't indexed any tags.
229
230				=item $store->reindex_all()
231
232				Call this if the index gets screwed up (or lost). It rebuilds it
233				from scratch.
234
235				=back
236
237				=head1 CAVEATS
238
239				Boulder::Store makes heavy use of the flock() call in order to avoid
240				corruption of DB_File databases when multiple processes try to write
241				simultaneously. flock() may not work correctly across NFS mounts,
242				particularly on Linux machines that are not running the rpc.lockd
243				daemon. Please confirm that your flock() works across NFS before
244				attempting to use Boulder::Store. If the store.t test hangs during
245				testing, this is the likely culprit.
246
247				=head1 AUTHOR
248
249				Lincoln D. Stein , Cold Spring Harbor Laboratory,
250				Cold Spring Harbor, NY. This module can be used and distributed on
251				the same terms as Perl itself.
252
253				=head1 SEE ALSO
254
255				L, L, L
256
257				=cut
258
259	1	1	4182	use Boulder::Stream;
	1		5
	1		39
260	1	1	5	use Carp;
	1		2
	1		78
261	1	1	6	use Fcntl;
	1		1
	1		303
262	1	1	1793	use DB_File;
	0
	0
263
264				$VERSION = '1.20';
265
266				@ISA = 'Boulder::Stream';
267				$lockfh='lock00000';
268				$LOCK_SH = 1;
269				$LOCK_EX = 2;
270				$LOCK_UN = 8;
271
272				# Override the old new() method.
273				# There is no passthrough behavior in the database version,
274				# because this is usually undesirable.
275				# In this case,$in is the pathname to the database to open.
276				sub new {
277				my($package,$in,$writable) = @_;
278				my $self = bless {
279				'records'=>undef, # filled in by _open_databases
280				'dbrecno'=>undef, # filled in by _open_databases
281				'index'=>undef, # filled in by _open_databases
282				'writable'=>$writable,
283				'basename'=>$in,
284				'passthru'=>undef,
285				'binary'=>'true',
286				'nextrecord'=>0, # next record to retrieve during iterations
287				'query_records'=>undef, # list of records during optimized queries
288				'query_test'=>undef, # an expression to apply to each record during a query
289				'IN'=>undef,
290				'OUT'=>undef,
291				'delim'=>'=',
292				'record_stop'=>"\n",
293				'line_end'=>'&',
294				'index_delim'=>' ',
295				'subrec_start'=>"\{",
296				'subrec_end'=>"\}"
297				},$package;
298				return undef unless _lock($self,'lock');
299				return _open_databases($self,$in) ? $self : undef;
300				}
301
302				sub DESTROY {
303				my $self = shift;
304				undef $self->{'dbrecno'};
305				untie %{$self->{'index'}};
306				untie @{$self->{'records'}};
307				_lock($self,'unlock');
308				}
309
310				#####################
311				# private routines
312				####################
313				# Obtain exclusive privileges if database is
314				# writable. Otherwise obtain shared privileges.
315				# Note that this call does not work across file systems,
316				# at least on non-linux systems. Should use fcntl()
317				# instead (but don't have Stevens at hand).
318				sub _lock {
319				my($self,$lockit) = @_;
320				my $in = $self->{'basename'};
321				my $lockfilename = "$in.lock";
322				if ($lockit eq 'lock') {
323				$lockfh++;
324				open($lockfh,"+>$lockfilename") \|\| return undef;
325				$self->{'lockfh'}=$lockfh;
326				return flock($lockfh,$self->{'writable'} ? $LOCK_EX : $LOCK_SH);
327				} else {
328				my $lockfh = $self->{'lockfh'};
329				unlink $lockfilename;
330				flock($lockfh,$LOCK_UN);
331				close($lockfh);
332				1;
333				}
334				}
335
336				sub _open_databases {
337				my $self = shift;
338
339				# Try to open up and/or create the recno and index files
340				my($in)=$self->{'basename'};
341				my (@records,%index);
342				my ($permissions) = $self->{'writable'} ? (O_RDWR\|O_CREAT) : O_RDONLY;
343				$self->{'dbrecno'} = tie(@records,DB_File,"$in.data",
344				$permissions,0640,$DB_RECNO) \|\| return undef;
345				tie(%index,DB_File,"$in.index",$permissions,0640,$DB_HASH) \|\| return undef;
346
347				$self->{'records'}=\@records;
348				$self->{'index'}=\%index;
349				1;
350				}
351
352				#########################################################################
353				# DELETE EVERYTHING FROM THE DATABASE
354				#########################################################################
355				sub empty {
356				my $self = shift;
357				my($base) = $self->{'basename'};
358				&DESTROY($self); # this closes the database and releases locks
359
360				# delete the files
361				foreach ('.data','.index') {
362				unlink "$base$_";
363				}
364
365				# Now reopen things
366				return _open_databases($self);
367				}
368
369				########################################################################
370				# DATA STORAGE
371				########################################################################
372				# This overrides the base object write_record.
373				# It writes the stone into the given position in the file.
374				# You can provide an index to put the record at a particular
375				# position, leave it undef to append the record to the end
376				# of the table, or provide a -1 to use the current record
377				# number of the stone to get the position. Just for fun,
378				# we return the record number of the added object.
379				sub write_record {
380				my($self,$stone,$index) = @_;
381				unless ($self->{'writable'}) {
382				warn "Attempt to write to read-only database $self->{'basename'}";
383				return undef;
384				}
385
386				my ($nextrecord);
387
388				if (defined($index) && $index == -1) {
389				my $stonepos = $stone->get('record_no');
390				$nextrecord = defined($stonepos) ? $stonepos : $self->length;
391				} else {
392				$nextrecord = (defined($index) && ($index >= 0) && ($index < $self->length))
393				? $index : $self->length;
394				}
395
396				# We figure out here what indices need to be updated
397				my %need_updating; # indexes that need fixing
398				if ($nextrecord != $self->length) {
399				my $old = $self->get($nextrecord);
400				if ($old) {
401				foreach ($self->indexed_keys) {
402				my $oldvalue = join('',$old->index($_));
403				my $newvalue = join('',$stone->index($_));
404				$need_updating{$_}++ if $oldvalue ne $newvalue;
405				}
406				}
407				$self->unindex_record($nextrecord,keys %need_updating) if %need_updating;
408				} else {
409				grep($need_updating{$_}++,$self->indexed_keys);
410				}
411
412				# Write out the Stone record.
413				$stone->replace('record_no',$nextrecord); # keep track of this please
414				my ($key,$value,@value,@lines);
415
416				foreach $key ($stone->tags) {
417				@value = $stone->get($key);
418				$key = $self->escapekey($key);
419				foreach $value (@value) {
420				if (ref $value && defined $value->{'.name'}) {
421				$value = $self->escapeval($value);
422				push(@lines,"$key$self->{delim}$value");
423				} else {
424				push(@lines,"$key$self->{delim}$self->{subrec_start}");
425				push(@lines,_write_nested($self,1,$value));
426				}
427				}
428				}
429				$self->{'records'}->[$nextrecord]=join("$self->{line_end}",@lines);
430				$self->index_record($nextrecord,keys %need_updating) if %need_updating;
431
432				$nextrecord;
433				}
434
435				# put() is an alias for write_record, except that it
436				# requires a record number.
437				sub put {
438				my($self,$stone,$record_no) = @_;
439				croak 'Usage: put($stone [,$record_no])' unless defined $stone;
440				$record_no = $stone->get('record_no') unless defined($record_no);
441				$self->write_record($stone,$record_no);
442				}
443
444				# Delete the record number from the database. You may
445				# provide either a numeric recno, or the stone itself.
446				# The deleted stone is returned (sans its record no).
447				sub delete {
448				my($self,$s) = @_;
449				my $recno;
450				if ( $s->isa('Stone') ) {
451				$recno = $s->get('record_no');
452				} else {
453				$recno = $s;
454				}
455				$self->unindex_record($recno); # remove from the index
456				$s = $self->get($recno) unless $s->isa('Stone');
457				delete $s->{recno}; # record number is gonzo
458				$self->{'dbrecno'}->del($recno); # this does the actual delete
459				$self->renumber_indices($recno);
460				$self->renumber_records($recno);
461				return $s;
462				}
463
464				########################################################################
465				# DATA RETRIEVAL
466				########################################################################
467				sub read_one_record {
468				my($self,@keywords) = @_;
469
470				return undef if $self->done;
471
472				my(%interested,$key,$value);
473				grep($interested{$_}++,@keywords);
474				$interested{'record_no'}++; # always interested in this one
475
476				my $delim=$self->{'delim'};
477				my $subrec_start=$self->{'subrec_start'};
478				my $subrec_end=$self->{'subrec_end'};
479				my ($stone,$pebble,$found);
480
481				while (1) {
482
483				undef $self->{LEVEL},last unless $_ = $self->next_pair;
484
485				if (/$subrec_end$/o) {
486				$self->{LEVEL}--,last if $self->{LEVEL};
487				next;
488				}
489
490				next unless ($key,$value) = split($self->{delim},$_);
491				$key = $self->unescapekey($key);
492				$stone = new Stone() unless $stone;
493
494				if ((!@keywords) \|\| $interested{$key}) {
495
496				$found++;
497				if ($value =~ /$subrec_start/o) {
498				$self->{LEVEL}++;
499				$pebble = read_one_record($self); # call ourselves recursively
500				$stone->insert($key=>$pebble);
501				next;
502				}
503
504				$stone->insert($key=>$self->unescapeval($value));
505				}
506				}
507
508				return undef unless $found;
509				return $stone;
510				}
511
512				# Read_record has the semantics that if a query is active,
513				# it will only return stones that satisfy the query.
514				sub read_record {
515				my($self,@tags) = @_;
516				my $query = $self->{'query_test'};
517				my $s;
518
519				if (wantarray) {
520				my(@result);
521				while (!$self->done) {
522				$s = $self->read_one_record(@tags);
523				next unless $s;
524				next if $query && !($query->($s));
525				push(@result,$s);
526				}
527				return @result;
528				} else {
529				while (!$self->done) {
530				$s = $self->read_one_record(@tags);
531				next unless $s;
532				return $s unless $query;
533				return $s if $query->($s);
534				}
535				return undef;
536				}
537				}
538
539				# Random access. This will have the interesting side effect
540				# of causing read_record() to begin iterating from this record
541				# number.
542				sub get {
543				my($self,$record,@tags) = @_;
544				$self->{'nextrecord'} = $record if defined($record);
545				undef $self->{'EOF'};
546				return $self->read_record(@tags);
547				}
548
549				# Reset database so we start iterating over the entire
550				# database at record no 0 again.
551				sub reset {
552				my $self = shift;
553				$self->{'EOF'} = undef;
554				$self->{'nextrecord'} = 0;
555				$self->{'query_test'} = undef;
556				$self->{'query_records'} = undef;
557				}
558
559				# Return the number of records in this file
560				sub length {
561				my $self = shift;
562				return $self->{'dbrecno'}->length;
563				}
564
565				# Return the number of unread query records
566				sub length_qrecs {
567				my $self = shift;
568				return $#{$self->{'query_records'}} + 1;
569				}
570
571				# Create a query. read_record() will then
572				# iterate over the query results. A query consists of
573				# an associative array of this form:
574				# index1=>value1,
575				# index2=>value2,
576				# ...
577				# indexN=>valueN,
578				# 'EVAL'=>[expression1,expression2,expression3...]
579				# 'EVAL'=>expression
580				#
581				# The index forms test for equality, and take advantage
582				# of any fast indexed keywords you've declared. For
583				# example, this will identify all white males:
584				# $db->query('Demographics.Sex'=>'M',
585				# 'Demographics.Race'=>'white');
586				#
587				# The code form allows you to retrieve Stones satisfying
588				# any arbitrary snippets of Perl code. Internally, the
589				# variable "$s" will be set to the current Stone.
590				# For example, find all whites > 30 years of age:
591				#
592				# $db->query('Demographics.Race'=>'white',
593				# 'EVAL'=>'$s->index(Age) > 30');
594				#
595				# EVAL (and "eval" too) expressions are ANDed together
596				# in the order you declare them. Internally indexed
597				# keywords are evaluated first in order to speed things up.
598
599				# A cute feature that may go away:
600				# You can use the expression as shorthand
601				# for $s->index('path.to.index')
602				sub query {
603				my($self,%query) = @_;
604				my($type,@expressions,%keylookups);
605
606				foreach $type (keys %query) {
607				if ($type =~ /^EVAL$/i) {
608				push (@expressions,$query{$type}) unless ref $query{$type};
609				push (@expressions,@{$query{$type}}) if ref $query{$type};
610				} else {
611				$keylookups{$type} = $query{$type};
612				}
613				}
614
615				# All the eval expressions are turned into a piece
616				# of perl code.
617				my $perlcode;
618				foreach (@expressions) {
619				s/<([\w.]+)>/\$s->index('$1')/g;
620				$_ = "($_)";
621				}
622
623				my %fast;
624				grep($fast{$_}++,$self->indexed_keys);
625				my %fastrecs;
626				my $fastset; # this flag keeps track of the first access to %fastrecs
627
628				foreach (keys %keylookups) {
629
630				if ($fast{$_}) {
631				my (@records) = $self->lookup($_,$keylookups{$_});
632				if ($fastset) {
633				my %tmp;
634				grep($fastrecs{$_} && $tmp{$_}++,@records);
635				%fastrecs = %tmp;
636				} else {
637				grep($fastrecs{$_}++,@records);
638				$fastset++;
639				}
640
641				} else { # slow record-by-record search
642				unshift(@expressions,"(\$s->index('$_') eq '$keylookups{$_}')");
643				}
644
645				}
646				$perlcode = 'sub { my $s = shift;' . join(' && ',@expressions) . ';}' if @expressions;
647				$perlcode = 'sub {1;}' unless @expressions;
648
649				# The next step either looks up a compiled query or
650				# creates one. We use a package global for this
651				# purpose, since the same query may be used for
652				# different databases.
653				my $coderef;
654				unless ($coderef = $QUERIES{$perlcode}) {
655				$coderef = $QUERIES{$perlcode} = eval $perlcode;
656				return undef if $@;
657				}
658
659				$self->reset; # clear out old information
660				$self->{'query_test'} = $coderef; # set us to check each record against the code
661				$self->{'query_records'} = [keys %fastrecs] if $fastset;
662				return 1;
663				}
664
665				# fetch() allows you to pass a query to the
666				# database, and get out all the stones that hit.
667				# Internally it is just a call to query() followed
668				# by an array-context call to read_record
669				sub fetch {
670				my($self,%query) = @_;
671				$self->query(%query);
672				my(@result) = $self->read_record(); # call in array context
673				return @result;
674				}
675
676				#--------------------------------------
677				# Internal (private) procedures.
678				#--------------------------------------
679				sub _write_nested {
680				my($self,$level,$stone) = @_;
681
682				my($key,$value,@value,@lines);
683
684				foreach $key ($stone->tags) {
685				@value = $stone->get($key);
686				$key = $self->escapekey($key);
687				foreach $value (@value) {
688				if (ref $value && defined $value->{'.name'}) {
689				$value = $self->escapeval($value);
690				push(@lines,"$key$self->{delim}$value");
691				} else {
692				push(@lines,"$key$self->{delim}$self->{subrec_start}");
693				push(@lines,_write_nested($self,$level+1,$value));
694				}
695				}
696				}
697
698				push(@lines,$self->{'subrec_end'});
699				return @lines;
700				}
701
702				# This finds an array of key/value pairs and
703				# stashes it where we can find it.
704				# This is overriden from the basic Boulder::Stream class,
705				# and relies on the state variable 'nextrecord' to tell
706				# it where to start reading from.
707				sub read_next_rec {
708				my($self) = @_;
709				my $data;
710
711				# two modes of retrieval:
712				# 1. regular iterate through the entire database
713				# 2. iterate through subset of records in 'query_records'
714				unless ($self->{'query_records'}) {
715				return !($self->{EOF}++) if $self->length <= $self->{'nextrecord'};
716				$data = $self->{'records'}->[$self->{'nextrecord'}];
717				$self->{'nextrecord'}++;
718				} else {
719				my $nextrecord = shift @{$self->{'query_records'}};
720				return !($self->{EOF}++) unless $nextrecord ne '';
721				$data = $self->{'records'}->[$nextrecord];
722				}
723
724				# unpack the guy into pairs
725				$self->{PAIRS}=[split($self->{'line_end'},$data)];
726				}
727
728				# This fiddles 'nextrecord' or 'query_records', as appropriate, so that
729				# the next call to read_next_rec will skip over $skip records.
730				sub skip_recs {
731				my($self,$skip) = @_;
732				unless ($self->{'query_records'}) {
733				$self->{'nextrecord'} += $skip;
734				} else {
735				splice(@{$self->{'query_records'}}, 0, $skip);
736				}
737				}
738
739				# Index a stone record
740				sub index_record {
741				my ($self,$recno,@indices) = @_;
742
743				my $s = $self->get($recno);
744				return undef unless defined($s);
745
746				my($index,@values,$value);
747				@indices = $self->indexed_keys unless @indices;
748				foreach $index (@indices) {
749				@values = $s->index($index);
750				foreach $value (@values) {
751				my %current;
752				grep($current{$_}++,split(" ",$self->{'index'}->{"$index:$value"}));
753				$current{$recno}++; # add us to the list
754				$self->{'index'}->{"$index:$value"} = join(" ",keys %current);
755				}
756				}
757				1;
758				}
759
760				# This is a NOP for now.
761				sub unindex_record {
762				my ($self,$recno,@indices) = @_;
763
764				my $s = $self->get($recno);
765				return undef unless defined($s);
766
767				my($index,@values,$value);
768				@indices = $self->indexed_keys unless @indices;
769
770				foreach $index (@indices) {
771				@values = $s->index($index);
772				foreach $value (@values) {
773				my %current;
774				grep($current{$_}++,split(" ",$self->{'index'}->{"$index:$value"}));
775				delete $current{$recno}; # remove us from the list
776				$self->{'index'}->{"$index:$value"} = join(" ",keys %current); # put index back
777				}
778				}
779				1;
780				};
781
782				# This gets called after a record delete, when all the indexes need to be
783				# shifted downwards -- this is probably WAY slow.
784				sub renumber_indices {
785				my ($self,$deleted_recno) = @_;
786				while (($key,$value) = each %{$self->{'index'}}) {
787				next if $key =~/^\./;
788				@values = split(" ",$value);
789				foreach (@values) {
790				$_-- if $_ > $deleted_recno;
791				}
792				# This will probably put us into an infinite loop!
793				$self->{'index'}->{$key} = join(" ",@values);
794				}
795				}
796
797				# This also gets called after a record delete, when all the indexes need to be
798				# shifted downwards -- this is probably WAY slow.
799				sub renumber_records {
800				my ($self,$deleted_recno) = @_;
801				$self->reset;
802				$recno = -1;
803				while ($s=$self->read_record) {
804				$recno++;
805				next unless $s->get('record_no') > $deleted_recno;
806				$s->replace('record_no',$recno);
807				$self->put($s);
808				}
809				}
810
811				# Look up a stone record using its index. Will return a list
812				# of the matching records
813				sub lookup {
814				my ($self,$index,$value) = @_;
815				my %records;
816				grep($records{$_}++,split(" ",$self->{'index'}->{"$index:$value"}));
817				return keys %records;
818				}
819
820				# Add an index (or list of indices) to the database.
821				# If new, then we do a reindexing.
822				sub add_index {
823				my ($self,@indices) = @_;
824				my (%oldindices);
825				grep($oldindices{$_}++,$self->indexed_keys);
826				my (@newindices) = grep(!$oldindices{$_},@indices);
827				$self->reindex_some_keys(@newindices);
828				$self->{'index'}->{'.INDICES'}=join($self->{'index_delim'},keys %oldindices,@newindices);
829				}
830
831				# Return the indexed keys as an associative array (convenient)
832				sub indexed_keys {
833				my $self = shift;
834				return split($self->{'index_delim'},$self->{'index'}->{'.INDICES'});
835				}
836
837				# Reindex all records that contain records involving the provided indices.
838				sub reindex_some_keys {
839				my($self,@new) = @_;
840				my ($s,$index,$value);
841				$self->reset; # reset to beginning of database
842
843				while ($s=$self->read_record) { # return all the stones
844				foreach $index (@new) {
845				foreach $value ($s->index($index)){ # pull out all the values at this index (if any)
846				my %current;
847				grep($current{$_}++,split(" ",$self->{'index'}->{"$index:$value"}));
848				$current{$s->get('record_no')}++;
849				$self->{'index'}->{"$index:$value"}=join(" ",keys %current);
850				}
851				}
852				}
853
854				}
855
856				# Completely rebuild the index.
857				sub reindex_all {
858				my $self = shift;
859				my ($index,$s,@values,$value);
860				$self->reset;
861				foreach $index ($self->indexed_keys) {
862				undef %records;
863				while ($s=$self->read_record) { # return all the stones
864				foreach $value ($s->index($index)){ # pull out all the values at this index (if any)
865				$records{"$index:$value"}->{$s->get('record_no')}++;
866				}
867				}
868				foreach (keys %records) {
869				$self->{'index'}->{$_}=join(" ",keys %{$records{$_}});
870				}
871				}
872				}
873
874
875				1;