source: main/trunk/greenstone2/perllib/dbutil.pm@ 30356

Last change on this file since 30356 was 30356, checked in by jmt12, 8 years ago

Complete rewrite of dbutil.pm to (rather than have databases hardcoded) use a dynamic object-oriented loading system.

File size: 15.3 KB
RevLine 
[30356]1###############################################################################
[15699]2#
[30356]3# dbutil.pm -- functions to handle using dbdrivers
[15699]4#
[30356]5# Copyright (c) 2015 New Zealand Digital Library Project
[15699]6#
[30356]7# A component of the Greenstone digital library software from the New Zealand
8# Digital Library Project at the University of Waikato, New Zealand.
[15699]9#
[30356]10# This program is free software; you can redistribute it and/or modify it under
11# the terms of the GNU General Public License as published by the Free Software
12# Foundation; either version 2 of the License, or (at your option) any later
13# version.
[15699]14#
[30356]15# This program is distributed in the hope that it will be useful, but WITHOUT
16# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
17# FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
18# details.
[15699]19#
[30356]20# You should have received a copy of the GNU General Public License along with
21# this program; if not, write to the Free Software Foundation, Inc., 675 Mass
22# Ave, Cambridge, MA 02139, USA.
23#
24###############################################################################
[15699]25
26package dbutil;
27
[30356]28# Pragma
[15699]29use strict;
30
[30356]31# DEBUGGING: You can enable a DBDriver one at a time to ensure they don't have
32# compilation errors.
33BEGIN
34{
35 if (!defined $ENV{'GSDLHOME'} || !defined $ENV{'GSDLOS'}) {
36 die("Error! Environment not prepared. Have you sourced setup.bash?\n");
37 }
38 # Are we running standalone? In which case the INC won't be correct
39 my $perllib_path = $ENV{'GSDLHOME'} . '/perllib';
40 my $all_inc = join(':', @INC);
41 if ($all_inc !~ /$perllib_path/) {
42 unshift(@INC, $perllib_path);
43 unshift(@INC, $ENV{'GSDLHOME'} . '/ext/parallel-building/perllib');
44 unshift(@INC, $ENV{'GSDLHOME'} . '/ext/tdb/perllib');
45 }
46 ## You can uncomment and name a Driver here to test it compiles
47 #require DBDrivers::TDBCLUSTER;
48 #my $driver = DBDrivers::TDBCLUSTER->new(1);
49}
[15699]50
[30356]51# Libraries
52use Devel::Peek;
53use Time::HiRes qw ( gettimeofday tv_interval );
54use FileUtils;
55use gsprintf 'gsprintf';
56use util;
57
58# Modulino pattern
59__PACKAGE__->main unless caller;
60
61###############################################################################
62## Private
63###############################################################################
64
65## Display debug messages?
66my $debug = 0; # Set to 1 to display
67
68## Keep track of the driver objects we have initialised
69my $dbdriver_pool = {};
70
71# Testing globals
72my $test_count = 0;
73my $pass_count = 0;
74my $skip_count = 0;
75
76
77## @function _addPathsToINC(void) => void
78#
79# A hopefully unused function to ensure the INC path contains all the available
80# perllib directories (from main, collection, and extensions)
81#
82sub _addPathsToINC
[17087]83{
[30356]84 &_debugPrint('_addPathsToINC() => ', 0);
85 my @possible_paths;
86 #... the main perllib directory...
87 push(@possible_paths, &FileUtils::filenameConcatenate());
88 #... a collection specific perllib directory...
89 if (defined $ENV{'GSDLCOLLECTDIR'} && $ENV{'GSDLCOLLECTION'}) {
90 push(@possible_paths, &FileUtils::filenameConcatenate($ENV{'GSDLCOLLECTDIR'}, 'collect', $ENV{'GSDLCOLLECTION'}, 'perllib'));
91 }
92 #... any registered extension may also have a perllib!
93 if (defined $ENV{'GSDLEXTS'} && defined $ENV{'GSDLHOME'}) {
94 foreach my $gs2_extension (split(/:/, $ENV{'GSDLEXTS'})) {
95 push(@possible_paths, &FileUtils::filenameConcatenate($ENV{'GSDLHOME'}, 'ext', $gs2_extension, 'perllib'));
96 }
97 }
98 if (defined $ENV{'GSDL3EXTS'} && defined $ENV{'GSDL3SRCHOME'}) {
99 foreach my $gs3_extension (split(/:/, $ENV{'GSDL3EXTS'})) {
100 push(@possible_paths, &FileUtils::filenameConcatenate($ENV{'GSDL3SRCHOME'}, 'ext', $gs3_extension, 'perllib'));
101 }
102 }
103 my $path_counter = 0;
104 foreach my $possible_path (@possible_paths) {
105 # we only try adding paths that actually exist
106 if (-d $possible_path) {
107 my $did_add_path = &util::augmentINC($possible_path);
108 if ($did_add_path) {
109 $path_counter++;
110 }
111 }
112 }
113 &_debugPrint('Added ' . $path_counter . ' paths');
114}
115## _addPathsToINC(void) => void #
[17087]116
[30356]117
118## @function _debugPrint(string, boolean)
119#
120sub _debugPrint
121{
122 my ($message, $newline) = @_;
123 if ($debug) {
124 if (!defined($newline)) {
125 $newline = 1;
126 }
127 print STDERR '[DEBUG] dbutil::' . $message;
128 if ($newline) {
129 print STDERR "\n";
130 }
131 }
[17087]132}
[30356]133## _debugPrint(string, boolean) => void ##
[17087]134
135
[30356]136## @function _isDriverLoaded(string) => boolean
137#
138sub _isDriverLoaded
[16176]139{
[30356]140 my ($dbdriver_name) = @_;
141 (my $dbdriver_file = $dbdriver_name) =~ s/::/\//g;
142 $dbdriver_file .= '.pm';
143 my $result = defined($INC{$dbdriver_file});
144 &_debugPrint('_isDriverLoaded("' . $dbdriver_name . '") => ' . $result);
145 return $result;
146}
147## _isDriverLoaded(string) => boolean ##
[16176]148
[30356]149## @function _loadDBDriver(string, string)
150#
151sub _loadDBDriver
152{
153 my ($dbdriver_name, $db_filepath) = @_;
154 my $dbdriver;
155 # I've decided (arbitrarily) to use uppercase for driver names since they
156 # are mostly acronyms
157 $dbdriver_name = uc($dbdriver_name);
158 # Ensure the driver has the correct package prefix
159 if ($dbdriver_name !~ /^DBDrivers/) {
160 $dbdriver_name = 'DBDrivers::' . $dbdriver_name;
161 }
162 # We only need to create each driver once
163 if (defined($dbdriver_pool->{$dbdriver_name})) {
164 $dbdriver = $dbdriver_pool->{$dbdriver_name};
165 }
166 else {
167 &_debugPrint('_loadDBDriver() => ' . $dbdriver_name);
168 # Assuming the INC is correctly setup, then this should work nicely
169 # - make sure we have required this dbdriver package
170 eval "require $dbdriver_name";
171 if (&_isDriverLoaded($dbdriver_name)) {
172 $dbdriver_name->import();
173 }
174 # What should we do about drivers that aren't there?
175 else {
176 print STDERR "Error! Failed to load: " . $dbdriver_name . "\n";
177 }
178 # Then initialise and return a new one
179 $dbdriver = $dbdriver_name->new($debug);
180 # Store it for later use
181 $dbdriver_pool->{$dbdriver_name} = $dbdriver;
182 }
183 return $dbdriver;
[17104]184}
[30356]185## _loadDBDriver(string, string) => BaseDBDriver ##
[16176]186
187
[30356]188## @function _printTest(string, integer) => void
189#
190sub _printTest
[15727]191{
[30356]192 my $title = shift(@_);
193 my $result = shift(@_);
194 $test_count++;
195 print " - Test: " . $title . "... ";
196 if ($result) {
197 print "Passed\n";
198 $pass_count++;
199 }
200 else {
201 print "Failed\n";
202 }
[15727]203}
[30356]204## _printTest(string, integer) => void ##
[15727]205
206
[30356]207sub _compareHash
[15710]208{
[30356]209 my $hash1 = shift(@_);
210 my $hash2 = shift(@_);
211 my $str1 = &_hash2str($hash1);
212 my $str2 = &_hash2str($hash2);
213 return ($str1 eq $str2);
214}
[15710]215
[30356]216sub _hash2str
217{
218 my $hash = shift(@_);
219 my $str = '';
220 foreach my $key (sort keys %{$hash}) {
221 $str .= '{' . $key . '=>{{' . join('},{', @{$hash->{$key}}) . '}}}';
222 }
223 return $str;
[15710]224}
225
226
[30356]227###############################################################################
228## Public
229###############################################################################
[15705]230
231
[30356]232## @function main(void) => void
233#
234sub main
[22485]235{
[30356]236 my $t0 = [gettimeofday()];
237 my $data1 = {'doh' => ['a deer, a female deer'],
238 'ray' => ['a drop of golden sun'],
239 'me' => ['a name I call myself'],
240 'far' => ['a long, long way to run']};
241 my $data2 = {'sew' => ['a needle pulling thread'],
242 'lah' => ['a note to follow doh'],
243 'tea' => ['a drink with jam and bread'],
244 'doh' => ['which brings us back to']};
245 $test_count = 0;
246 $pass_count = 0;
247 $skip_count = 0;
248 print "===== DBUtils Testing Suite =====\n";
249 print "For each driver specified, run a battery of tests\n";
250 my @drivers;
251 foreach my $arg (@ARGV) {
252 if ($arg =~ /^-+([a-z]+)(=.+)?$/) {
253 my $arg_name = $1;
254 my $arg_value = $2;
255 if ($arg_name eq 'debug') {
256 $debug = 1;
257 }
258 }
259 else {
260 push(@drivers, $arg);
261 }
[22485]262 }
[30356]263 if (scalar(@drivers)) {
264 # Ensure the Perl can load the drivers from all the typical places
265 &_addPathsToINC();
266 foreach my $driver_name (@drivers) {
267 my $t1 = [gettimeofday()];
268 print "=== Testing: " . $driver_name . " ===\n";
269 my $driver = _loadDBDriver($driver_name);
270 my $db_path = $driver->get_infodb_file_path('test-doc','/tmp/');
271 print " - Path: " . $db_path . "\n";
272 # 1. Open handle
273 my $db_handle = $driver->open_infodb_write_handle($db_path);
274 &_printTest('opening handle', (defined $db_handle));
275 # 2a. Write entry
276 $driver->write_infodb_entry($db_handle, 'Alpha', $data1);
277 &_printTest('writing entry', 1);
278 # 2b. Write raw entry
279 my $raw_data = $driver->convert_infodb_hash_to_string($data1);
280 $driver->write_infodb_rawentry($db_handle, 'Beta', $raw_data);
281 &_printTest('writing raw entry', 1);
282 # 3. Close handle
283 $driver->close_infodb_write_handle($db_handle);
284 if ($driver->supportsPersistentConnection()) {
285 $test_count += 1;
286 $skip_count += 1;
287 print " - Skipping test as persistent drivers delay 'close'.\n";
288 }
289 else {
290 &_printTest('closing handle', (tell($db_handle) < 1));
291 }
292 if (!$driver->writeOnly()) {
293 # 4a. Read entry
294 my $data3 = $driver->read_infodb_entry($db_path, 'Alpha');
295 &_printTest('read entry', &_compareHash($data1, $data3));
296 # 4b. Read raw entry
297 my $raw_data4 = $driver->read_infodb_rawentry($db_path, 'Beta');
298 my $data4 = $driver->convert_infodb_string_to_hash($raw_data4);
299 &_printTest('read raw entry', &_compareHash($data1, $data4));
300 # 5. Read keys
301 my $keys1 = {};
302 $driver->read_infodb_keys($db_path, $keys1);
303 &_printTest('read keys', (defined $keys1->{'Alpha'} && defined $keys1->{'Beta'}));
304 # 6. Set entry
305 if ($driver->supportsSet()) {
306 my $status = $driver->set_infodb_entry($db_path, 'Alpha', $data2);
307 &_printTest('set entry (1)', ($status >= 0));
308 my $data5 = $driver->read_infodb_entry($db_path, 'Alpha');
309 &_printTest('set entry (2)', &_compareHash($data2, $data5));
310 }
311 else {
312 $test_count += 2;
313 $skip_count += 2;
314 print " - Skipping 2 tests as 'set' is not supported by this driver.\n";
315 }
316 # 7. Delete entry
317 my $db_handle2 = $driver->open_infodb_write_handle($db_path, 'append');
318 $driver->delete_infodb_entry($db_handle2, 'Alpha');
319 $driver->close_infodb_write_handle($db_handle2);
320 my $keys2 = {};
321 $driver->read_infodb_keys($db_path, $keys2);
322 &_printTest('delete entry', ((!defined $keys2->{'Alpha'}) && (defined $keys2->{'Beta'})));
323 }
324 else
325 {
326 $test_count += 6;
327 $skip_count += 6;
328 print " - Skipping 6 tests as driver is write-only.\n";
329 }
330 # 8. Remove test db
331 unlink($db_path);
332 my $t2 = [gettimeofday()];
333 my $elapsed1 = tv_interval($t1, $t2);
334 print " - Testing took " . $elapsed1 . " seconds\n";
335 }
336 print "===== Results =====\n";
337 print "Drivers Tested: " . scalar(@drivers) . "\n";
338 print "Tests Run: " . $test_count . "\n";
339 print "Tests Passed: " . $pass_count . "\n";
340 print "Tests Failed: " . ($test_count - $pass_count - $skip_count) . "\n";
341 print "Tests Skipped: " . $skip_count . "\n";
[22485]342 }
[30356]343 else
[22485]344 {
[30356]345 print "Warning! No drivers specified - expected as arguments to call\n";
[22485]346 }
[30356]347 my $t3 = [gettimeofday()];
348 my $elapsed2 = tv_interval($t0, $t3);
349 print "===== Complete in " . $elapsed2 . " seconds =====\n";
350 print "\n";
351 exit(0);
[22485]352}
[30356]353## main(void) => void
[15705]354
[30356]355
356## @function close_infodb_write_handle(string, *) => void
357#
358sub close_infodb_write_handle
[23485]359{
360 my $infodb_type = shift(@_);
[30356]361 my $driver = _loadDBDriver($infodb_type);
362 $driver->close_infodb_write_handle(@_);
363}
364## close_infodb_write_handle(string, *) => void ##
[23485]365
[30356]366
367## @function delete_infodb_entry(string, *) => void
368#
369sub delete_infodb_entry
370{
371 my $infodb_type = shift(@_);
372 my $driver = _loadDBDriver($infodb_type);
373 $driver->delete_infodb_entry(@_);
[23485]374}
[30356]375## delete_infodb_entry(string, *) => void ##
[23485]376
377
[30356]378## @function mergeDatabases(string, *) => integer
379#
380sub mergeDatabases
[21547]381{
[30356]382 my $infodb_type = shift(@_);
383 my $driver = _loadDBDriver($infodb_type);
384 my $status = $driver->mergeDatabases(@_);
385 return $status;
386}
387## mergeDatabases(string, *) => integer ##
[21547]388
[30356]389
390## @function get_default_infodb_type(void) => string
391#
392sub get_default_infodb_type
393{
394 # The default is GDBM so everything works the same for existing collections
395 # To use something else, specify the "infodbtype" in the collection's collect.cfg file
396 return 'gdbm';
[21547]397}
[30356]398## get_default_infodb_type(void) => string ##
[21547]399
400
[30356]401## @function get_infodb_file_path(string, *) => string
402#
403sub get_infodb_file_path
[15699]404{
[30356]405 my $infodb_type = shift(@_);
406 my $driver = _loadDBDriver($infodb_type);
407 my $infodb_file_path = $driver->get_infodb_file_path(@_);
408 return $infodb_file_path;
409}
410## get_infodb_file_path(string, *) => string ##
[15699]411
[15725]412
[30356]413## @function open_infodb_write_handle(string, *) => filehandle
414#
415sub open_infodb_write_handle
416{
417 my $infodb_type = shift(@_);
418 my $driver = _loadDBDriver($infodb_type);
419 my $infodb_handle = $driver->open_infodb_write_handle(@_);
420 return $infodb_handle;
[15699]421}
[30356]422## open_infodb_write_handle(string, *) => filehandle ##
[15699]423
[15705]424
[30356]425## @function read_infodb_file(string, *) => void
426#
427sub read_infodb_file
[21856]428{
[30356]429 my $infodb_type = shift(@_);
430 my $driver = _loadDBDriver($infodb_type);
431 $driver->read_infodb_file(@_);
432}
433## read_infodb_file(string, *) => void ##
[21856]434
435
[30356]436## @function read_infodb_keys(string, *) => void
437#
438sub read_infodb_keys
439{
440 my $infodb_type = shift(@_);
441 my $driver = _loadDBDriver($infodb_type);
442 $driver->read_infodb_keys(@_);
[21856]443}
[30356]444## read_infodb_keys(string, *) => void ##
[21856]445
446
[30356]447## @function read_infodb_entry(string, *) => hashmap
448#
449sub read_infodb_entry
[23399]450{
[30356]451 my $infodb_type = shift(@_);
452 my $driver = _loadDBDriver($infodb_type);
453 my $infodb_entry = $driver->read_infodb_entry(@_);
454 return $infodb_entry;
455}
456## read_infodb_entry(string, *) => hashmap ##
[21856]457
[23399]458
[30356]459## @function read_infodb_rawentry(string, *) => string
460#
461sub read_infodb_rawentry
462{
463 my $infodb_type = shift(@_);
464 my $driver = _loadDBDriver($infodb_type);
465 my $raw_infodb_entry = $driver->read_infodb_rawentry(@_);
466 return $raw_infodb_entry;
[23399]467}
[30356]468## read_infodb_rawentry(string, *) => string ##
[23399]469
470
[30356]471## @function set_infodb_entry(string, *) => integer
472#
473sub set_infodb_entry
[18467]474{
[30356]475 my $infodb_type = shift(@_);
476 my $driver = _loadDBDriver($infodb_type);
477 my $status = $driver->set_infodb_entry(@_);
478 return $status;
479}
480## set_infodb_entry(string, *) => integer ##
[15705]481
[18467]482
[30356]483## @function supportDatestamp(string) => boolean
484#
485sub supportsDatestamp
486{
487 my $infodb_type = shift(@_);
488 my $driver = _loadDBDriver($infodb_type);
489 my $supports_datestamp = $driver->supportsDatestamp();
490 return $supports_datestamp;
[18467]491}
[30356]492## supportsDatestamp(string) => boolean ##
[18467]493
494
[30356]495## @function supportMerge(string) => boolean
496#
497sub supportsMerge
[21550]498{
[30356]499 my $infodb_type = shift(@_);
500 my $driver = _loadDBDriver($infodb_type);
501 my $supports_merge = $driver->supportsMerge();
502 return $supports_merge;
503}
504## supportsMerge(string) => boolean ##
[21550]505
506
[30356]507## @function supportRSS(string) => boolean
508#
509sub supportsRSS
510{
511 my $infodb_type = shift(@_);
512 my $driver = _loadDBDriver($infodb_type);
513 my $supports_rss = $driver->supportsRSS();
514 return $supports_rss;
[21550]515}
[30356]516## supportsRSS(string) => boolean ##
[21550]517
518
[30356]519## @function write_infodb_entry(string, *) => void
520#
521sub write_infodb_entry
[21550]522{
[30356]523 my $infodb_type = shift(@_);
524 my $driver = _loadDBDriver($infodb_type);
525 $driver->write_infodb_entry(@_);
526}
527## write_infodb_entry(string, *) => void ##
[21550]528
529
[30356]530## @function write_infodb_rawentry(string, *) => void
531#
532sub write_infodb_rawentry
533{
534 my $infodb_type = shift(@_);
535 my $driver = _loadDBDriver($infodb_type);
536 $driver->write_infodb_rawentry(@_);
[21550]537}
[30356]538## write_infodb_rawentry(string, *) => void ##
[21550]539
[15699]5401;
Note: See TracBrowser for help on using the repository browser.