2 |
|
|
3 |
use strict; |
use strict; |
4 |
use Tracer; |
use Tracer; |
5 |
use DBKernel; |
use DBrtns; |
6 |
use Data::Dumper; |
use Data::Dumper; |
7 |
use XML::Simple; |
use XML::Simple; |
8 |
use DBQuery; |
use DBQuery; |
9 |
use DBObject; |
use DBObject; |
10 |
use Stats; |
use Stats; |
11 |
use Time::HiRes qw(gettimeofday); |
use Time::HiRes qw(gettimeofday); |
12 |
|
use FIG; |
13 |
|
|
14 |
=head1 Entity-Relationship Database Package |
=head1 Entity-Relationship Database Package |
15 |
|
|
301 |
# Table of information about our datatypes. "sqlType" is the corresponding SQL datatype string. |
# Table of information about our datatypes. "sqlType" is the corresponding SQL datatype string. |
302 |
# "maxLen" is the maximum permissible length of the incoming string data used to populate a field |
# "maxLen" is the maximum permissible length of the incoming string data used to populate a field |
303 |
# of the specified type. "dataGen" is PERL string that will be evaluated if no test data generation |
# of the specified type. "dataGen" is PERL string that will be evaluated if no test data generation |
304 |
#string is specified in the field definition. |
# string is specified in the field definition. "avgLen" is the average byte length for estimating |
305 |
my %TypeTable = ( char => { sqlType => 'CHAR(1)', maxLen => 1, dataGen => "StringGen('A')" }, |
# record sizes. |
306 |
int => { sqlType => 'INTEGER', maxLen => 20, dataGen => "IntGen(0, 99999999)" }, |
my %TypeTable = ( char => { sqlType => 'CHAR(1)', maxLen => 1, avgLen => 1, dataGen => "StringGen('A')" }, |
307 |
string => { sqlType => 'VARCHAR(255)', maxLen => 255, dataGen => "StringGen(IntGen(10,250))" }, |
int => { sqlType => 'INTEGER', maxLen => 20, avgLen => 4, dataGen => "IntGen(0, 99999999)" }, |
308 |
text => { sqlType => 'TEXT', maxLen => 1000000000, dataGen => "StringGen(IntGen(80,1000))" }, |
string => { sqlType => 'VARCHAR(255)', maxLen => 255, avgLen => 100, dataGen => "StringGen(IntGen(10,250))" }, |
309 |
date => { sqlType => 'BIGINT', maxLen => 80, dataGen => "DateGen(-7, 7, IntGen(0,1400))" }, |
text => { sqlType => 'TEXT', maxLen => 1000000000, avgLen => 500, dataGen => "StringGen(IntGen(80,1000))" }, |
310 |
float => { sqlType => 'DOUBLE PRECISION', maxLen => 40, dataGen => "FloatGen(0.0, 100.0)" }, |
date => { sqlType => 'BIGINT', maxLen => 80, avgLen => 8, dataGen => "DateGen(-7, 7, IntGen(0,1400))" }, |
311 |
boolean => { sqlType => 'SMALLINT', maxLen => 1, dataGen => "IntGen(0, 1)" }, |
float => { sqlType => 'DOUBLE PRECISION', maxLen => 40, avgLen => 8, dataGen => "FloatGen(0.0, 100.0)" }, |
312 |
|
boolean => { sqlType => 'SMALLINT', maxLen => 1, avgLen => 2, dataGen => "IntGen(0, 1)" }, |
313 |
'key-string' => |
'key-string' => |
314 |
{ sqlType => 'VARCHAR(40)', maxLen => 40, dataGen => "StringGen(IntGen(10,40))" }, |
{ sqlType => 'VARCHAR(40)', maxLen => 40, avgLen => 10, dataGen => "StringGen(IntGen(10,40))" }, |
315 |
'name-string' => |
'name-string' => |
316 |
{ sqlType => 'VARCHAR(80)', maxLen => 80, dataGen => "StringGen(IntGen(10,80))" }, |
{ sqlType => 'VARCHAR(80)', maxLen => 80, avgLen => 40, dataGen => "StringGen(IntGen(10,80))" }, |
317 |
'medium-string' => |
'medium-string' => |
318 |
{ sqlType => 'VARCHAR(160)', maxLen => 160, dataGen => "StringGen(IntGen(10,160))" }, |
{ sqlType => 'VARCHAR(160)', maxLen => 160, avgLen => 40, dataGen => "StringGen(IntGen(10,160))" }, |
319 |
); |
); |
320 |
|
|
321 |
# Table translating arities into natural language. |
# Table translating arities into natural language. |
371 |
|
|
372 |
=head3 ShowMetaData |
=head3 ShowMetaData |
373 |
|
|
374 |
C<< $database->ShowMetaData($fileName); >> |
C<< $erdb->ShowMetaData($fileName); >> |
375 |
|
|
376 |
This method outputs a description of the database. This description can be used to help users create |
This method outputs a description of the database. This description can be used to help users create |
377 |
the data to be loaded into the relations. |
the data to be loaded into the relations. |
526 |
|
|
527 |
=head3 DumpMetaData |
=head3 DumpMetaData |
528 |
|
|
529 |
C<< $database->DumpMetaData(); >> |
C<< $erdb->DumpMetaData(); >> |
530 |
|
|
531 |
Return a dump of the metadata structure. |
Return a dump of the metadata structure. |
532 |
|
|
541 |
|
|
542 |
=head3 CreateTables |
=head3 CreateTables |
543 |
|
|
544 |
C<< $datanase->CreateTables(); >> |
C<< $erdb->CreateTables(); >> |
545 |
|
|
546 |
This method creates the tables for the database from the metadata structure loaded by the |
This method creates the tables for the database from the metadata structure loaded by the |
547 |
constructor. It is expected this function will only be used on rare occasions, when the |
constructor. It is expected this function will only be used on rare occasions, when the |
579 |
|
|
580 |
=head3 CreateTable |
=head3 CreateTable |
581 |
|
|
582 |
C<< $database->CreateTable($tableName, $indexFlag); >> |
C<< $erdb->CreateTable($tableName, $indexFlag, $estimatedRows); >> |
583 |
|
|
584 |
Create the table for a relation and optionally create its indexes. |
Create the table for a relation and optionally create its indexes. |
585 |
|
|
589 |
|
|
590 |
Name of the relation (which will also be the table name). |
Name of the relation (which will also be the table name). |
591 |
|
|
592 |
=item $indexFlag |
=item indexFlag |
593 |
|
|
594 |
TRUE if the indexes for the relation should be created, else FALSE. If FALSE, |
TRUE if the indexes for the relation should be created, else FALSE. If FALSE, |
595 |
L</CreateIndexes> must be called later to bring the indexes into existence. |
L</CreateIndexes> must be called later to bring the indexes into existence. |
596 |
|
|
597 |
|
=item estimatedRows (optional) |
598 |
|
|
599 |
|
If specified, the estimated maximum number of rows for the relation. This |
600 |
|
information allows the creation of tables using storage engines that are |
601 |
|
faster but require size estimates, such as MyISAM. |
602 |
|
|
603 |
=back |
=back |
604 |
|
|
605 |
=cut |
=cut |
606 |
|
|
607 |
sub CreateTable { |
sub CreateTable { |
608 |
# Get the parameters. |
# Get the parameters. |
609 |
my ($self, $relationName, $indexFlag) = @_; |
my ($self, $relationName, $indexFlag, $estimatedRows) = @_; |
610 |
# Get the database handle. |
# Get the database handle. |
611 |
my $dbh = $self->{_dbh}; |
my $dbh = $self->{_dbh}; |
612 |
# Get the relation data and determine whether or not the relation is primary. |
# Get the relation data and determine whether or not the relation is primary. |
630 |
# Insure the table is not already there. |
# Insure the table is not already there. |
631 |
$dbh->drop_table(tbl => $relationName); |
$dbh->drop_table(tbl => $relationName); |
632 |
Trace("Table $relationName dropped.") if T(2); |
Trace("Table $relationName dropped.") if T(2); |
633 |
|
# If there are estimated rows, create an estimate so we can take advantage of |
634 |
|
# faster DB technologies. |
635 |
|
my $estimation = undef; |
636 |
|
if ($estimatedRows) { |
637 |
|
$estimation = [$self->EstimateRowSize($relationName), $estimatedRows]; |
638 |
|
} |
639 |
# Create the table. |
# Create the table. |
640 |
Trace("Creating table $relationName: $fieldThing") if T(2); |
Trace("Creating table $relationName: $fieldThing") if T(2); |
641 |
$dbh->create_table(tbl => $relationName, flds => $fieldThing); |
$dbh->create_table(tbl => $relationName, flds => $fieldThing, estimates => $estimation); |
642 |
Trace("Relation $relationName created in database.") if T(2); |
Trace("Relation $relationName created in database.") if T(2); |
643 |
# If we want to build the indexes, we do it here. |
# If we want to build the indexes, we do it here. |
644 |
if ($indexFlag) { |
if ($indexFlag) { |
648 |
|
|
649 |
=head3 CreateIndex |
=head3 CreateIndex |
650 |
|
|
651 |
C<< $database->CreateIndex($relationName); >> |
C<< $erdb->CreateIndex($relationName); >> |
652 |
|
|
653 |
Create the indexes for a relation. If a table is being loaded from a large source file (as |
Create the indexes for a relation. If a table is being loaded from a large source file (as |
654 |
is the case in L</LoadTable>), it is sometimes best to create the indexes after the load. |
is the case in L</LoadTable>), it is sometimes best to create the indexes after the load. |
681 |
|
|
682 |
=head3 LoadTables |
=head3 LoadTables |
683 |
|
|
684 |
C<< my $stats = $database->LoadTables($directoryName, $rebuild); >> |
C<< my $stats = $erdb->LoadTables($directoryName, $rebuild); >> |
685 |
|
|
686 |
This method will load the database tables from a directory. The tables must already have been created |
This method will load the database tables from a directory. The tables must already have been created |
687 |
in the database. (This can be done by calling L</CreateTables>.) The caller passes in a directory name; |
in the database. (This can be done by calling L</CreateTables>.) The caller passes in a directory name; |
751 |
|
|
752 |
=head3 GetTableNames |
=head3 GetTableNames |
753 |
|
|
754 |
C<< my @names = $database->GetTableNames; >> |
C<< my @names = $erdb->GetTableNames; >> |
755 |
|
|
756 |
Return a list of the relations required to implement this database. |
Return a list of the relations required to implement this database. |
757 |
|
|
768 |
|
|
769 |
=head3 GetEntityTypes |
=head3 GetEntityTypes |
770 |
|
|
771 |
C<< my @names = $database->GetEntityTypes; >> |
C<< my @names = $erdb->GetEntityTypes; >> |
772 |
|
|
773 |
Return a list of the entity type names. |
Return a list of the entity type names. |
774 |
|
|
783 |
return sort keys %{$entityList}; |
return sort keys %{$entityList}; |
784 |
} |
} |
785 |
|
|
786 |
|
=head3 IsEntity |
787 |
|
|
788 |
|
C<< my $flag = $erdb->IsEntity($entityName); >> |
789 |
|
|
790 |
|
Return TRUE if the parameter is an entity name, else FALSE. |
791 |
|
|
792 |
|
=over 4 |
793 |
|
|
794 |
|
=item entityName |
795 |
|
|
796 |
|
Object name to be tested. |
797 |
|
|
798 |
|
=item RETURN |
799 |
|
|
800 |
|
Returns TRUE if the specified string is an entity name, else FALSE. |
801 |
|
|
802 |
|
=back |
803 |
|
|
804 |
|
=cut |
805 |
|
|
806 |
|
sub IsEntity { |
807 |
|
# Get the parameters. |
808 |
|
my ($self, $entityName) = @_; |
809 |
|
# Test to see if it's an entity. |
810 |
|
return exists $self->{_metaData}->{Entities}->{$entityName}; |
811 |
|
} |
812 |
|
|
813 |
=head3 Get |
=head3 Get |
814 |
|
|
815 |
C<< my $query = $database->Get(\@objectNames, $filterClause, $param1, $param2, ..., $paramN); >> |
C<< my $query = $erdb->Get(\@objectNames, $filterClause, $param1, $param2, ..., $paramN); >> |
816 |
|
|
817 |
This method returns a query object for entities of a specified type using a specified filter. |
This method returns a query object for entities of a specified type using a specified filter. |
818 |
The filter is a standard WHERE/ORDER BY clause with question marks as parameter markers and each |
The filter is a standard WHERE/ORDER BY clause with question marks as parameter markers and each |
820 |
following call requests all B<Genome> objects for the genus specified in the variable |
following call requests all B<Genome> objects for the genus specified in the variable |
821 |
$genus. |
$genus. |
822 |
|
|
823 |
C<< $query = $sprout->Get(['Genome'], "Genome(genus) = ?", $genus); >> |
C<< $query = $erdb->Get(['Genome'], "Genome(genus) = ?", $genus); >> |
824 |
|
|
825 |
The WHERE clause contains a single question mark, so there is a single additional |
The WHERE clause contains a single question mark, so there is a single additional |
826 |
parameter representing the parameter value. It would also be possible to code |
parameter representing the parameter value. It would also be possible to code |
827 |
|
|
828 |
C<< $query = $sprout->Get(['Genome'], "Genome(genus) = \'$genus\'"); >> |
C<< $query = $erdb->Get(['Genome'], "Genome(genus) = \'$genus\'"); >> |
829 |
|
|
830 |
however, this version of the call would generate a syntax error if there were any quote |
however, this version of the call would generate a syntax error if there were any quote |
831 |
characters inside the variable C<$genus>. |
characters inside the variable C<$genus>. |
837 |
It is possible to specify multiple entity and relationship names in order to retrieve more than |
It is possible to specify multiple entity and relationship names in order to retrieve more than |
838 |
one object's data at the same time, which allows highly complex joined queries. For example, |
one object's data at the same time, which allows highly complex joined queries. For example, |
839 |
|
|
840 |
C<< $query = $sprout->Get(['Genome', 'ComesFrom', 'Source'], "Genome(genus) = ?", $genus); >> |
C<< $query = $erdb->Get(['Genome', 'ComesFrom', 'Source'], "Genome(genus) = ?", $genus); >> |
841 |
|
|
842 |
If multiple names are specified, then the query processor will automatically determine a |
If multiple names are specified, then the query processor will automatically determine a |
843 |
join path between the entities and relationships. The algorithm used is very simplistic. |
join path between the entities and relationships. The algorithm used is very simplistic. |
1000 |
$command .= " ORDER BY $orderClause"; |
$command .= " ORDER BY $orderClause"; |
1001 |
} |
} |
1002 |
} |
} |
1003 |
Trace("SQL query: $command") if T(2); |
Trace("SQL query: $command") if T(3); |
1004 |
Trace("PARMS: '" . (join "', '", @params) . "'") if (T(3) && (@params > 0)); |
Trace("PARMS: '" . (join "', '", @params) . "'") if (T(4) && (@params > 0)); |
1005 |
my $sth = $dbh->prepare_command($command); |
my $sth = $dbh->prepare_command($command); |
1006 |
# Execute it with the parameters bound in. |
# Execute it with the parameters bound in. |
1007 |
$sth->execute(@params) || Confess("SELECT error" . $sth->errstr()); |
$sth->execute(@params) || Confess("SELECT error" . $sth->errstr()); |
1012 |
|
|
1013 |
=head3 GetList |
=head3 GetList |
1014 |
|
|
1015 |
C<< my @dbObjects = $database->GetList(\@objectNames, $filterClause, $param1, $param2, ..., $paramN); >> |
C<< my @dbObjects = $erdb->GetList(\@objectNames, $filterClause, $param1, $param2, ..., $paramN); >> |
1016 |
|
|
1017 |
Return a list of object descriptors for the specified objects as determined by the |
Return a list of object descriptors for the specified objects as determined by the |
1018 |
specified filter clause. |
specified filter clause. |
1075 |
|
|
1076 |
=head3 ComputeObjectSentence |
=head3 ComputeObjectSentence |
1077 |
|
|
1078 |
C<< my $sentence = $database->ComputeObjectSentence($objectName); >> |
C<< my $sentence = $erdb->ComputeObjectSentence($objectName); >> |
1079 |
|
|
1080 |
Check an object name, and if it is a relationship convert it to a relationship sentence. |
Check an object name, and if it is a relationship convert it to a relationship sentence. |
1081 |
|
|
1110 |
|
|
1111 |
=head3 DumpRelations |
=head3 DumpRelations |
1112 |
|
|
1113 |
C<< $database->DumpRelations($outputDirectory); >> |
C<< $erdb->DumpRelations($outputDirectory); >> |
1114 |
|
|
1115 |
Write the contents of all the relations to tab-delimited files in the specified directory. |
Write the contents of all the relations to tab-delimited files in the specified directory. |
1116 |
Each file will have the same name as the relation dumped, with an extension of DTX. |
Each file will have the same name as the relation dumped, with an extension of DTX. |
1152 |
|
|
1153 |
=head3 InsertObject |
=head3 InsertObject |
1154 |
|
|
1155 |
C<< my $ok = $database->InsertObject($objectType, \%fieldHash); >> |
C<< my $ok = $erdb->InsertObject($objectType, \%fieldHash); >> |
1156 |
|
|
1157 |
Insert an object into the database. The object is defined by a type name and then a hash |
Insert an object into the database. The object is defined by a type name and then a hash |
1158 |
of field names to values. Field values in the primary relation are represented by scalars. |
of field names to values. Field values in the primary relation are represented by scalars. |
1161 |
example, the following line inserts an inactive PEG feature named C<fig|188.1.peg.1> with aliases |
example, the following line inserts an inactive PEG feature named C<fig|188.1.peg.1> with aliases |
1162 |
C<ZP_00210270.1> and C<gi|46206278>. |
C<ZP_00210270.1> and C<gi|46206278>. |
1163 |
|
|
1164 |
C<< $database->InsertObject('Feature', { id => 'fig|188.1.peg.1', active => 0, feature-type => 'peg', alias => ['ZP_00210270.1', 'gi|46206278']}); >> |
C<< $erdb->InsertObject('Feature', { id => 'fig|188.1.peg.1', active => 0, feature-type => 'peg', alias => ['ZP_00210270.1', 'gi|46206278']}); >> |
1165 |
|
|
1166 |
The next statement inserts a C<HasProperty> relationship between feature C<fig|158879.1.peg.1> and |
The next statement inserts a C<HasProperty> relationship between feature C<fig|158879.1.peg.1> and |
1167 |
property C<4> with an evidence URL of C<http://seedu.uchicago.edu/query.cgi?article_id=142>. |
property C<4> with an evidence URL of C<http://seedu.uchicago.edu/query.cgi?article_id=142>. |
1168 |
|
|
1169 |
C<< $database->InsertObject('HasProperty', { 'from-link' => 'fig|158879.1.peg.1', 'to-link' => 4, evidence = 'http://seedu.uchicago.edu/query.cgi?article_id=142'}); >> |
C<< $erdb->InsertObject('HasProperty', { 'from-link' => 'fig|158879.1.peg.1', 'to-link' => 4, evidence = 'http://seedu.uchicago.edu/query.cgi?article_id=142'}); >> |
1170 |
|
|
1171 |
=over 4 |
=over 4 |
1172 |
|
|
1291 |
|
|
1292 |
=head3 LoadTable |
=head3 LoadTable |
1293 |
|
|
1294 |
C<< my %results = $database->LoadTable($fileName, $relationName, $truncateFlag); >> |
C<< my %results = $erdb->LoadTable($fileName, $relationName, $truncateFlag); >> |
1295 |
|
|
1296 |
Load data from a tab-delimited file into a specified table, optionally re-creating the table |
Load data from a tab-delimited file into a specified table, optionally re-creating the table |
1297 |
first. |
first. |
1332 |
# Check the truncation flag. |
# Check the truncation flag. |
1333 |
if ($truncateFlag) { |
if ($truncateFlag) { |
1334 |
Trace("Creating table $relationName") if T(2); |
Trace("Creating table $relationName") if T(2); |
1335 |
|
# Compute the row count estimate. We take the size of the load file, |
1336 |
|
# divide it by the estimated row size, and then multiply by 1.5 to |
1337 |
|
# leave extra room. We postulate a minimum row count of 1000 to |
1338 |
|
# prevent problems with incoming empty load files. |
1339 |
|
my $rowSize = $self->EstimateRowSize($relationName); |
1340 |
|
my $fileSize = -s $fileName; |
1341 |
|
my $estimate = FIG::max($fileSize * 1.5 / $rowSize, 1000); |
1342 |
# Re-create the table without its index. |
# Re-create the table without its index. |
1343 |
$self->CreateTable($relationName, 0); |
$self->CreateTable($relationName, 0, $estimate); |
1344 |
# If this is a pre-index DBMS, create the index here. |
# If this is a pre-index DBMS, create the index here. |
1345 |
if ($dbh->{_preIndex}) { |
if ($dbh->{_preIndex}) { |
1346 |
eval { |
eval { |
1351 |
} |
} |
1352 |
} |
} |
1353 |
} |
} |
|
# Determine whether or not this is a primary relation. Primary relations have an extra |
|
|
# field indicating whether or not a given object is new or was loaded from the flat files. |
|
|
my $primary = $self->_IsPrimary($relationName); |
|
|
# Get the number of fields in this relation. |
|
|
my @fieldList = @{$relation->{Fields}}; |
|
|
my $fieldCount = @fieldList; |
|
|
# Start a database transaction. |
|
|
$dbh->begin_tran; |
|
|
# Open the relation file. We need to create a cleaned-up copy before loading. |
|
|
open TABLEIN, '<', $fileName; |
|
|
my $tempName = "$fileName.tbl"; |
|
|
open TABLEOUT, '>', $tempName; |
|
|
my $inputCount = 0; |
|
|
# Loop through the file. |
|
|
while (<TABLEIN>) { |
|
|
$inputCount++; |
|
|
# Chop off the new-line character. |
|
|
my $record = Tracer::Strip($_); |
|
|
# Only proceed if the record is non-blank. |
|
|
if ($record) { |
|
|
# Escape all the backslashes found in the line. |
|
|
$record =~ s/\\/\\\\/g; |
|
|
# Insure the number of fields is correct. |
|
|
my @fields = split /\t/, $record; |
|
|
while (@fields > $fieldCount) { |
|
|
my $extraField = $fields[$#fields]; |
|
|
delete $fields[$#fields]; |
|
|
if ($extraField) { |
|
|
Trace("Nonblank extra field value \"$extraField\" deleted from record $inputCount of $fileName.") if T(1); |
|
|
} |
|
|
} |
|
|
while (@fields < $fieldCount) { |
|
|
push @fields, ""; |
|
|
} |
|
|
# If this is a primary relation, add a 0 for the new-record flag (indicating that |
|
|
# this record is not new, but part of the original load). |
|
|
if ($primary) { |
|
|
push @fields, "0"; |
|
|
} |
|
|
# Write the record. |
|
|
$record = join "\t", @fields; |
|
|
print TABLEOUT "$record\n"; |
|
|
# Count the record written. |
|
|
my $count = $retVal->Add('records'); |
|
|
my $len = length $record; |
|
|
Trace("Record $count written with $len characters.") if T(4); |
|
|
} else { |
|
|
# Here we have a blank record. |
|
|
$retVal->Add('skipped'); |
|
|
} |
|
|
} |
|
|
# Close the files. |
|
|
close TABLEIN; |
|
|
close TABLEOUT; |
|
|
Trace("Temporary file $tempName created.") if T(2); |
|
1354 |
# Load the table. |
# Load the table. |
1355 |
my $rv; |
my $rv; |
1356 |
eval { |
eval { |
1357 |
$rv = $dbh->load_table(file => $tempName, tbl => $relationName); |
$rv = $dbh->load_table(file => $fileName, tbl => $relationName); |
1358 |
}; |
}; |
1359 |
if (!defined $rv) { |
if (!defined $rv) { |
1360 |
$retVal->AddMessage($@) if ($@); |
$retVal->AddMessage($@) if ($@); |
1361 |
$retVal->AddMessage("Table load failed for $relationName using $tempName."); |
$retVal->AddMessage("Table load failed for $relationName using $fileName."); |
1362 |
Trace("Table load failed for $relationName.") if T(1); |
Trace("Table load failed for $relationName.") if T(1); |
1363 |
} else { |
} else { |
1364 |
# Here we successfully loaded the table. Trace the number of records loaded. |
# Here we successfully loaded the table. Trace the number of records loaded. |
1375 |
} |
} |
1376 |
# Commit the database changes. |
# Commit the database changes. |
1377 |
$dbh->commit_tran; |
$dbh->commit_tran; |
1378 |
# Delete the temporary file. |
# Analyze the table to improve performance. |
1379 |
unlink $tempName; |
$dbh->vacuum_it($relationName); |
1380 |
# Return the statistics. |
# Return the statistics. |
1381 |
return $retVal; |
return $retVal; |
1382 |
} |
} |
1383 |
|
|
1384 |
=head3 GenerateEntity |
=head3 GenerateEntity |
1385 |
|
|
1386 |
C<< my $fieldHash = $database->GenerateEntity($id, $type, \%values); >> |
C<< my $fieldHash = $erdb->GenerateEntity($id, $type, \%values); >> |
1387 |
|
|
1388 |
Generate the data for a new entity instance. This method creates a field hash suitable for |
Generate the data for a new entity instance. This method creates a field hash suitable for |
1389 |
passing as a parameter to L</InsertObject>. The ID is specified by the callr, but the rest |
passing as a parameter to L</InsertObject>. The ID is specified by the callr, but the rest |
1441 |
|
|
1442 |
=head3 GetEntity |
=head3 GetEntity |
1443 |
|
|
1444 |
C<< my $entityObject = $sprout->GetEntity($entityType, $ID); >> |
C<< my $entityObject = $erdb->GetEntity($entityType, $ID); >> |
1445 |
|
|
1446 |
Return an object describing the entity instance with a specified ID. |
Return an object describing the entity instance with a specified ID. |
1447 |
|
|
1477 |
|
|
1478 |
=head3 GetEntityValues |
=head3 GetEntityValues |
1479 |
|
|
1480 |
C<< my @values = GetEntityValues($entityType, $ID, \@fields); >> |
C<< my @values = $erdb->GetEntityValues($entityType, $ID, \@fields); >> |
1481 |
|
|
1482 |
Return a list of values from a specified entity instance. |
Return a list of values from a specified entity instance. |
1483 |
|
|
1520 |
|
|
1521 |
=head3 GetAll |
=head3 GetAll |
1522 |
|
|
1523 |
C<< my @list = $sprout->GetAll(\@objectNames, $filterClause, \@parameters, \@fields, $count); >> |
C<< my @list = $erdb->GetAll(\@objectNames, $filterClause, \@parameters, \@fields, $count); >> |
1524 |
|
|
1525 |
Return a list of values taken from the objects returned by a query. The first three |
Return a list of values taken from the objects returned by a query. The first three |
1526 |
parameters correspond to the parameters of the L</Get> method. The final parameter is |
parameters correspond to the parameters of the L</Get> method. The final parameter is |
1536 |
spreadsheet cell, and each feature will be represented by a list containing the |
spreadsheet cell, and each feature will be represented by a list containing the |
1537 |
feature ID followed by all of its aliases. |
feature ID followed by all of its aliases. |
1538 |
|
|
1539 |
C<< $query = $sprout->Get(['ContainsFeature', 'Feature'], "ContainsFeature(from-link) = ?", [$ssCellID], ['Feature(id)', 'Feature(alias)']); >> |
C<< $query = $erdb->Get(['ContainsFeature', 'Feature'], "ContainsFeature(from-link) = ?", [$ssCellID], ['Feature(id)', 'Feature(alias)']); >> |
1540 |
|
|
1541 |
=over 4 |
=over 4 |
1542 |
|
|
1605 |
return @retVal; |
return @retVal; |
1606 |
} |
} |
1607 |
|
|
1608 |
|
=head3 EstimateRowSize |
1609 |
|
|
1610 |
|
C<< my $rowSize = $erdb->EstimateRowSize($relName); >> |
1611 |
|
|
1612 |
|
Estimate the row size of the specified relation. The estimated row size is computed by adding |
1613 |
|
up the average length for each data type. |
1614 |
|
|
1615 |
|
=over 4 |
1616 |
|
|
1617 |
|
=item relName |
1618 |
|
|
1619 |
|
Name of the relation whose estimated row size is desired. |
1620 |
|
|
1621 |
|
=item RETURN |
1622 |
|
|
1623 |
|
Returns an estimate of the row size for the specified relation. |
1624 |
|
|
1625 |
|
=back |
1626 |
|
|
1627 |
|
=cut |
1628 |
|
#: Return Type $; |
1629 |
|
sub EstimateRowSize { |
1630 |
|
# Get the parameters. |
1631 |
|
my ($self, $relName) = @_; |
1632 |
|
# Declare the return variable. |
1633 |
|
my $retVal = 0; |
1634 |
|
# Find the relation descriptor. |
1635 |
|
my $relation = $self->_FindRelation($relName); |
1636 |
|
# Get the list of fields. |
1637 |
|
for my $fieldData (@{$relation->{Fields}}) { |
1638 |
|
# Get the field type and add its length. |
1639 |
|
my $fieldLen = $TypeTable{$fieldData->{type}}->{avgLen}; |
1640 |
|
$retVal += $fieldLen; |
1641 |
|
} |
1642 |
|
# Return the result. |
1643 |
|
return $retVal; |
1644 |
|
} |
1645 |
|
|
1646 |
=head2 Internal Utility Methods |
=head2 Internal Utility Methods |
1647 |
|
|
1648 |
=head3 GetLoadStats |
=head3 GetLoadStats |
2018 |
sub _LoadMetaData { |
sub _LoadMetaData { |
2019 |
# Get the parameters. |
# Get the parameters. |
2020 |
my ($filename) = @_; |
my ($filename) = @_; |
2021 |
|
Trace("Reading Sprout DBD from $filename.") if T(2); |
2022 |
# Slurp the XML file into a variable. Extensive use of options is used to insure we |
# Slurp the XML file into a variable. Extensive use of options is used to insure we |
2023 |
# get the exact structure we want. |
# get the exact structure we want. |
2024 |
my $metadata = XML::Simple::XMLin($filename, |
my $metadata = XML::Simple::XMLin($filename, |
2225 |
my @fromList = (); |
my @fromList = (); |
2226 |
my @toList = (); |
my @toList = (); |
2227 |
my @bothList = (); |
my @bothList = (); |
2228 |
Trace("Join table build for $entityName.") if T(3); |
Trace("Join table build for $entityName.") if T(4); |
2229 |
for my $relationshipName (keys %{$relationshipList}) { |
for my $relationshipName (keys %{$relationshipList}) { |
2230 |
my $relationship = $relationshipList->{$relationshipName}; |
my $relationship = $relationshipList->{$relationshipName}; |
2231 |
# Determine if this relationship has our entity in one of its link fields. |
# Determine if this relationship has our entity in one of its link fields. |
2232 |
my $fromEntity = $relationship->{from}; |
my $fromEntity = $relationship->{from}; |
2233 |
my $toEntity = $relationship->{to}; |
my $toEntity = $relationship->{to}; |
2234 |
Trace("Join check for relationship $relationshipName from $fromEntity to $toEntity.") if T(3); |
Trace("Join check for relationship $relationshipName from $fromEntity to $toEntity.") if T(4); |
2235 |
if ($fromEntity eq $entityName) { |
if ($fromEntity eq $entityName) { |
2236 |
if ($toEntity eq $entityName) { |
if ($toEntity eq $entityName) { |
2237 |
# Here the relationship is recursive. |
# Here the relationship is recursive. |
2238 |
push @bothList, $relationshipName; |
push @bothList, $relationshipName; |
2239 |
Trace("Relationship $relationshipName put in both-list.") if T(3); |
Trace("Relationship $relationshipName put in both-list.") if T(4); |
2240 |
} else { |
} else { |
2241 |
# Here the relationship comes from the entity. |
# Here the relationship comes from the entity. |
2242 |
push @fromList, $relationshipName; |
push @fromList, $relationshipName; |
2243 |
Trace("Relationship $relationshipName put in from-list.") if T(3); |
Trace("Relationship $relationshipName put in from-list.") if T(4); |
2244 |
} |
} |
2245 |
} elsif ($toEntity eq $entityName) { |
} elsif ($toEntity eq $entityName) { |
2246 |
# Here the relationship goes to the entity. |
# Here the relationship goes to the entity. |
2247 |
push @toList, $relationshipName; |
push @toList, $relationshipName; |
2248 |
Trace("Relationship $relationshipName put in to-list.") if T(3); |
Trace("Relationship $relationshipName put in to-list.") if T(4); |
2249 |
} |
} |
2250 |
} |
} |
2251 |
# Create the nonrecursive joins. Note that we build two hashes for running |
# Create the nonrecursive joins. Note that we build two hashes for running |
2291 |
# relationship can only be ambiguous with another recursive relationship, |
# relationship can only be ambiguous with another recursive relationship, |
2292 |
# and the incoming relationship from the outer loop is never recursive. |
# and the incoming relationship from the outer loop is never recursive. |
2293 |
for my $otherName (@bothList) { |
for my $otherName (@bothList) { |
2294 |
Trace("Setting up relationship joins to recursive relationship $otherName with $relationshipName.") if T(3); |
Trace("Setting up relationship joins to recursive relationship $otherName with $relationshipName.") if T(4); |
2295 |
# Join from the left. |
# Join from the left. |
2296 |
$joinTable{"$relationshipName/$otherName"} = |
$joinTable{"$relationshipName/$otherName"} = |
2297 |
"$linkField = $otherName.from_link"; |
"$linkField = $otherName.from_link"; |
2306 |
# rise to situations where we can't create the path we want; however, it is always |
# rise to situations where we can't create the path we want; however, it is always |
2307 |
# possible to get the same effect using multiple queries. |
# possible to get the same effect using multiple queries. |
2308 |
for my $relationshipName (@bothList) { |
for my $relationshipName (@bothList) { |
2309 |
Trace("Setting up entity joins to recursive relationship $relationshipName with $entityName.") if T(3); |
Trace("Setting up entity joins to recursive relationship $relationshipName with $entityName.") if T(4); |
2310 |
# Join to the entity from each direction. |
# Join to the entity from each direction. |
2311 |
$joinTable{"$entityName/$relationshipName"} = |
$joinTable{"$entityName/$relationshipName"} = |
2312 |
"$entityName.id = $relationshipName.from_link"; |
"$entityName.id = $relationshipName.from_link"; |