######################################################################
#
# EPrints::Database
#
######################################################################
#
#
######################################################################

=pod

=for Pod2Wiki

=head1 NAME

B<EPrints::Database> - a connection to the SQL database for an eprints session.

=head1 DESCRIPTION

EPrints Database Access Module

Provides access to the backend database. All database access is done via this module, in the hope that the backend can be replaced as easily as possible.

In most use-cases it should not be necessary to use the database module directly. Instead you should use L<EPrints::DataSet> or L<EPrints::MetaField> accessor methods to access objects and field values respectively.

=head2 Cross-database Support

Any use of SQL statements must use L</quote_identifier> to quote database tables and columns and L</quote_value> to quote values. The only exception to this are the EPrints::Database::* modules which provide database-driver specific extensions.

=head2 Quoting SQL Values

By convention variables that contain already quoted values are prefixed with C<Q_> so they can be easily recognised when used in string interpolation:

	my $Q_value = $db->quote_value( "Hello, World!" );
	$db->do("SELECT $Q_value");

Where possible you should avoid quoting values yourself, instead use a method that accepts unquoted values which will (safely) do the work for you.

=head1 CONSTANTS

All the C<SQL_*> column types defined by Perl module L<DBI> and the following:

=over 4

=item SQL_NULL

A column value is undefined.

=item SQL_NOT_NULL

A column value is defined.

=back

=head1 INSTANCE VARIABLES

=over 4

=item $self->{session}

The L<EPrints::Session> which is associated with this database connection.

=item $self->{debug}

If C<true> then SQL is logged.

=item $self->{dbh}

The handle on the actual database connection.

=back

=cut

######################################################################

package EPrints::Database;

use DBI ();
use APR::UUID;

use EPrints;

require Exporter;
@ISA = qw( Exporter );

# SQL_NULL / SQL_NOT_NULL are local to this module; every other type is
# the DBI constant of the same name.
use constant {
	SQL_NULL => 0,
	SQL_NOT_NULL => 1,
	SQL_VARCHAR => DBI::SQL_VARCHAR,
	SQL_LONGVARCHAR => DBI::SQL_LONGVARCHAR,
	SQL_VARBINARY => DBI::SQL_VARBINARY,
	SQL_LONGVARBINARY => DBI::SQL_LONGVARBINARY,
	SQL_TINYINT => DBI::SQL_TINYINT,
	SQL_SMALLINT => DBI::SQL_SMALLINT,
	SQL_INTEGER => DBI::SQL_INTEGER,
	SQL_BIGINT => DBI::SQL_BIGINT,
	SQL_REAL => DBI::SQL_REAL,
	SQL_DOUBLE => DBI::SQL_DOUBLE,
	SQL_DATE => DBI::SQL_DATE,
	SQL_TIME => DBI::SQL_TIME,
	SQL_CLOB => DBI::SQL_CLOB,
	SQL_DECIMAL => DBI::SQL_DECIMAL,
};

%EXPORT_TAGS = (
	sql_types => [qw(
		SQL_NULL
		SQL_NOT_NULL
		SQL_VARCHAR
		SQL_LONGVARCHAR
		SQL_CLOB
		SQL_VARBINARY
		SQL_LONGVARBINARY
		SQL_TINYINT
		SQL_SMALLINT
		SQL_INTEGER
		SQL_BIGINT
		SQL_REAL
		SQL_DOUBLE
		SQL_DATE
		SQL_TIME
	)],
);
Exporter::export_tags( qw( sql_types ) );

use strict;

my $DEBUG_SQL = 0;

# this may not be the current version of eprints, it's the version
# of eprints where the current desired db configuration became standard.
$EPrints::Database::DBVersion = "3.3.4";

# ID of next buffer table. This can safely reset to zero each time
# The module restarts as it is only used for temporary tables.
#
my $NEXTBUFFER = 0;
my %TEMPTABLES = ();

######################################################################
=pod

=head1 METHODS

=head2 Database

=cut
######################################################################

######################################################################
=pod

=over 4

=item $db = EPrints::Database->new( $repo, [ %opts ] )

Create a connection to the database.

Options:

  db_connect - Boolean. Also connect to the database (default: true).

Returns C<undef> if a connection was requested but no database handle
could be obtained.

=cut
######################################################################

sub new
{
	my( $class, $repo, %opts ) = @_;

	my $self = $class->_new( $repo );

	# Connecting is the default; only an explicit db_connect option
	# (even a false one) overrides it.
	my $wants_connection = 1;
	$wants_connection = $opts{db_connect} if exists $opts{db_connect};
	return( $self ) unless $wants_connection;

	$self->connect;

	return( defined $self->{dbh} ? $self : undef );
}

# Build the (unconnected) database object. The object is blessed into
# the driver-specific subclass named by the "dbdriver" configuration
# option, falling back to "mysql" when that option is unset or false.
sub _new
{
	my( $class, $session ) = @_;

	my $driver_class = join '::', $class, ( $session->config( "dbdriver" ) || "mysql" );

	# load the driver subclass, re-throwing any compile/load error
	eval "use $driver_class; 1";
	die $@ if $@;

	my $self = bless {
		session => $session,
		# a noise level of exactly 3 switches SQL logging on
		debug => ( $session->{noise} == 3 ? 1 : $DEBUG_SQL ),
	}, $driver_class;

	# only weaken the back-reference when Scalar::Util::weaken is available
	Scalar::Util::weaken($self->{session})
		if defined &Scalar::Util::weaken;

	return $self;
}

######################################################################
=pod

=item $db = $db->create( $username, $password )

Create and connect to a new database using user account C<$username> and C<$password>.

This base implementation always aborts with an error message.

=cut
######################################################################

sub create
{
	my( $self, $username, $password ) = @_;

	my $message = "Current database driver does not support database creation";

	EPrints::abort( $message );
}

######################################################################
=pod

=item $dbstr = EPrints::Database::build_connection_string( %params )

Build the string to use to connect to the database via L<DBI>.

Parameters:

  dbname - Database name (REQUIRED).
  dbdriver - Database driver (e.g. mysql, Oracle, pgsql, default: mysql).
  dbhost - Database host. Assumes localhost if unset.
  dbport - Port to connect to database host. Assumes default for driver if unset.
  dbsock - Socket file to connect to database through.

=cut
######################################################################

sub build_connection_string
{
	my( %params ) = @_;

	$params{dbdriver} ||= "mysql";

	# build the connection string
	my $dsn = "DBI:$params{dbdriver}:";
	if( $params{dbdriver} eq "Oracle" )
	{
		# the Oracle driver is addressed by SID rather than database name
		$dsn .= "sid=$params{dbsid}";
	}
	else
	{
		$dsn .= "database=$params{dbname}";
	}
	if( defined $params{dbhost} )
	{
		$dsn.= ";host=".$params{dbhost};
	}
	if( defined $params{dbport} )
	{
		$dsn.= ";port=".$params{dbport};
	}
	if( defined $params{dbsock} )
	{
		$dsn.= ";mysql_socket=".$params{dbsock};
	}
	if ( $params{dbdriver} eq "mysql" )
	{
		$dsn.= ";mysql_enable_utf8=1";
	}

	return $dsn;
}

######################################################################
=pod

=item $db->connect()

Connects to the database, storing the handle in C<< $self->{dbh} >>.

Returns true on success and nothing if no handle could be obtained.

=cut
######################################################################

sub connect
{
	my( $self ) = @_;

	my $repo = $self->{session};

	# Each config() lookup is forced into scalar context: inside a
	# key => value list an empty-list return would otherwise shift every
	# following pair by one.
	my $dsn = build_connection_string(
		dbdriver => scalar $repo->config("dbdriver"),
		dbhost => scalar $repo->config("dbhost"),
		dbsock => scalar $repo->config("dbsock"),
		dbport => scalar $repo->config("dbport"),
		dbname => scalar $repo->config("dbname"),
	);

	# Connect to the database
	$self->{dbh} = DBI->connect_cached(
		$dsn,
		scalar $repo->config("dbuser"),
		scalar $repo->config("dbpass"),
		{
			AutoCommit => 1,
		} );

	return unless defined $self->{dbh};

	# at noise level 4 and above also switch on DBI's own tracing
	if( $repo->{noise} >= 4 )
	{
		$self->{dbh}->trace( 2 );
	}

	return 1;
}

######################################################################
=pod

=item $db->disconnect()

Disconnects from the EPrints database. Should always be done before any script exits.

Calling this method more than once is harmless: the database handle is
forgotten after the first call, so later calls have nothing to disconnect.

=cut
######################################################################

sub disconnect
{
	my( $self ) = @_;

	# Make sure that we don't disconnect twice, or inappropriately:
	# taking the handle out of the object means a repeated call finds
	# nothing to disconnect.
	my $dbh = delete $self->{dbh};
	if( defined $dbh && !$dbh->disconnect() )
	{
		my $message = "Database disconnect error: ".$dbh->errstr;
		if( defined $self->{session} )
		{
			$self->{session}->get_repository->log( $message );
		}
		else
		{
			# the session reference may already be gone, in which
			# case there is no repository log to write to
			warn "$message\n";
		}
	}

	delete $self->{session};
}

######################################################################
=pod

=item $db->set_debug( $boolean )

Set the SQL debug mode to C<true> or C<false>.

=cut
######################################################################

sub set_debug
{
	my( $self, $debug ) = @_;

	$self->{debug} = $debug;
}

######################################################################
=pod

=item $db->set_version( $versionid );

Set the version id table in the SQL database to the given C<$versionid> (used by the upgrade script).

=cut
######################################################################

sub set_version
{
	my( $self, $versionid ) = @_;

	my $sql;

	# the table and its single column are both called "version"
	my $Q_version = $self->quote_identifier( "version" );

	$sql = "UPDATE $Q_version SET $Q_version = ".$self->quote_value( $versionid );
	$self->do( $sql );

	if( $self->{session}->get_noise >= 1 )
	{
		print "Set DB compatibility flag to '$versionid'.\n";
	}
}

######################################################################
=pod

=item $version = $db->get_version

Returns the current database schema version.

=cut
######################################################################

sub get_version
{
	my( $self ) = @_;

	# silence DBI error reporting for the duration of this lookup; a
	# failed query simply yields an undefined version
	local $self->{dbh}->{PrintError} = 0;
	local $self->{dbh}->{RaiseError} = 0;

	my $Q_version = $self->quote_identifier( "version" );

	my $sql = "SELECT $Q_version FROM $Q_version";
	my( $version ) = $self->{dbh}->selectrow_array( $sql );

	return $version;
}

######################################################################
=pod

=item $boolean = $db->is_latest_version

Return true if the SQL tables are in the correct configuration for this edition of eprints. Otherwise, false.

=cut
######################################################################

sub is_latest_version
{
	my( $self ) = @_;

	my $version = $self->get_version;
	# no readable version at all can never be the latest one
	return 0 unless( defined $version );

	return $version eq $EPrints::Database::DBVersion;
}

######################################################################
=pod

=item $version = $db->get_server_version

Return the database server version.

This base implementation returns nothing.

=cut
######################################################################

sub get_server_version {}

######################################################################
=pod

=item $charset = $db->get_default_charset

Return the character set to use. Returns C<undef> if character sets are unsupported.

This base implementation returns nothing.

=cut
######################################################################

sub get_default_charset {}

######################################################################
=pod

=item $collation = $db->get_default_collation( $lang )

Return the collation to use for language C<$lang>. Returns C<undef> if collation is unsupported.

This base implementation returns nothing.

=cut
######################################################################

sub get_default_collation {}

######################################################################
=pod

=item $driver = $db->get_driver_name

Return the database driver name, in the form:

	CLASS [DBI x.y, DBD::driver a.b]

where CLASS is the class of C<$db>.

=cut
######################################################################

sub get_driver_name
{
	my( $self ) = @_;

	my $dbd = $self->{dbh}->{Driver}->{Name};

	# Read $DBD::<driver>::VERSION through a symbolic reference rather
	# than compiling the driver name into a string eval.
	my $dbd_version = do {
		no strict "refs";
		${"DBD::${dbd}::VERSION"};
	};
	# a driver without a $VERSION is reported with an empty version
	$dbd_version = "" if !defined $dbd_version;

	return ref($self)." [DBI $DBI::VERSION, DBD::$dbd $dbd_version]";
}

######################################################################
=pod

=item $errstr = $db->error()

Return a string describing the last SQL error.

=cut
######################################################################

sub error
{
	my( $self ) = @_;

	my $dbh = $self->{dbh};

	return $dbh->errstr;
}

######################################################################
=pod

=item $boolean = $db->retry_error()

Returns a boolean for whether the database error is a retry error.

This base implementation always answers 0.

=cut
######################################################################

sub retry_error
{
	return 0;
}

######################################################################
=pod

=item $boolean = $db->duplicate_error()

Returns a boolean for whether the database error is a duplicate error.

This base implementation always answers 0.

=cut
######################################################################

sub duplicate_error
{
	return 0;
}

######################################################################
=pod

=item $db->begin()

Begin a transaction.

=cut
######################################################################

sub begin
{
	my( $self ) = @_;

	# a transaction is opened by switching auto-commit off on the handle
	my $dbh = $self->{dbh};
	$dbh->{AutoCommit} = 0;
}

######################################################################
=pod

=item $db->commit()

Commit the previously begun transaction.

Does nothing if no transaction is open, i.e. auto-commit is still on.

=cut
######################################################################

sub commit
{
	my( $self ) = @_;

	my $dbh = $self->{dbh};

	# nothing was begun, so there is nothing to commit
	return if $dbh->{AutoCommit};

	$dbh->commit;
	$dbh->{AutoCommit} = 1;
}

######################################################################
=pod

=item $db->rollback()

Rollback the partially completed transaction.

Does nothing if no transaction is open, i.e. auto-commit is still on.

=cut
######################################################################

sub rollback
{
	my( $self ) = @_;

	my $dbh = $self->{dbh};

	# nothing was begun, so there is nothing to undo
	return if $dbh->{AutoCommit};

	$dbh->rollback;
	$dbh->{AutoCommit} = 1;
}

######################################################################
=pod

=item $type_info = $db->type_info( $data_type )

See L<DBI/type_info>.

=cut
######################################################################

sub type_info
{
	my( $self, $data_type ) = @_;

	# every type except SQL_BIGINT is described by the DBI handle
	return $self->{dbh}->type_info( $data_type )
		if $data_type ne SQL_BIGINT;

	# SQL_BIGINT gets a fixed description instead of asking the driver
	my %bigint = (
		TYPE_NAME => "bigint",
		CREATE_PARAMS => "",
		COLUMN_SIZE => 19,
	);

	return \%bigint;
}

######################################################################
=pod

See L<DBI/type_info> for the underlying type metadata.

=item $real_type = $db->get_column_type( $name, $data_type, $not_null, [ $length, $scale, %opts ] )

Returns a SQL column definition for C<$name> of type C<$data_type>, usually something like:

	$name $type($length,$scale) [ NOT NULL ]

If C<$not_null> is true the column will be set to C<NOT NULL>.

C<$length> and C<$scale> control the maximum lengths of character or decimal types (see below).

Other options available to refine the column definition:

	langid - character set/collation to use
	sorted - whether this column will be used to order by

B<langid> is mapped to real database values by the "dblanguages" configuration option. The database may not be able to order the request column type in which case, if C<sorted> is true, the database may use a substitute column type.

C<$data_type> is the SQL type. The types are constants defined by this module, to import them use:

	use EPrints::Database qw( :sql_types );

Supported types (n = requires C<$length> argument):

Character data: C<SQL_VARCHAR(n)>, C<SQL_LONGVARCHAR>, C<SQL_CLOB>.

Binary data: C<SQL_VARBINARY(n)>, C<SQL_LONGVARBINARY>.

Integer data: C<SQL_TINYINT>, C<SQL_SMALLINT>, C<SQL_INTEGER>, C<SQL_BIGINT>.

Floating-point data: C<SQL_REAL>, C<SQL_DOUBLE>.

Time data: C<SQL_DATE>, C<SQL_TIME>.

The actual column types used will be database-specific.

=cut
######################################################################

sub get_column_type
{
	my( $self, $name, $data_type, $not_null, $length, $scale, %opts ) = @_;

	# type_info() may yield nothing for a type the driver does not know;
	# only take the slice when there is a hash to take it from, so that
	# the explanatory abort below can actually be reached.
	my $type_info = $self->type_info( $data_type );
	my( $db_type, $params );
	if( defined $type_info )
	{
		( $db_type, $params ) = @$type_info{
			qw( TYPE_NAME CREATE_PARAMS )
		};
	}

	if( !defined $db_type )
	{
		# try to name the offending type in the error message
		foreach my $type (@{$EPrints::Database::EXPORT_TAGS{sql_types}})
		{
			my $constant = EPrints::Database->can( $type );
			if( defined $constant && $data_type == $constant->() )
			{
				EPrints::abort( "DBI driver does not appear to support $type" );
			}
		}
		EPrints::abort( "Unknown SQL data type, must be one of: ".join(', ', @{$EPrints::Database::EXPORT_TAGS{sql_types}}) );
	}

	my $type = $self->quote_identifier($name) . " " . $db_type;

	# CREATE_PARAMS says which size arguments the column type takes
	$params ||= "";
	if( $params eq "max length" )
	{
		EPrints::abort( "get_column_type expected LENGTH argument for $data_type [$type]" )
			unless defined $length;
		$type .= "($length)";
	}
	elsif( $params eq "precision,scale" )
	{
		# both values are interpolated below, so both are required
		EPrints::abort( "get_column_type expected PRECISION and SCALE arguments for $data_type [$type]" )
			unless defined $length && defined $scale;
		$type .= "($length,$scale)";
	}

	# $default is only emitted together with NOT NULL (see below)
	my $default = "";
	if(
		$data_type eq SQL_VARCHAR() or
		$data_type eq SQL_LONGVARCHAR() or
		$data_type eq SQL_CLOB()
	  )
	{
		my $langid = $opts{langid};
		if( !defined $langid )
		{
			$langid = "en";
		}

		my $charset = $self->get_default_charset( $langid );
		if( !defined $charset )
		{
			$charset = "UTF8";
		}
		$type .= " CHARACTER SET ".$charset;

		my $collate = $self->get_default_collation( $langid );
		if( defined( $collate ) )
		{
			$type .= " COLLATE ".$collate;
		}

		$default = " DEFAULT ''" if $data_type eq SQL_VARCHAR();
	}
	elsif (
		$data_type eq SQL_TINYINT() or
		$data_type eq SQL_SMALLINT() or
		$data_type eq SQL_INTEGER() or
		$data_type eq SQL_BIGINT() or
		$data_type eq SQL_REAL() or
		$data_type eq SQL_DOUBLE() or
		$data_type eq SQL_DECIMAL()
	  )
	{
		$default = " DEFAULT 0";
	}
	elsif ( $data_type eq SQL_DATE() )
	{
		$default = " DEFAULT '0000-00-00'";
	}
	elsif ( $data_type eq SQL_TIME() )
	{
		$default = " DEFAULT '0000-00-00 00:00:00'";
	}

	if( $not_null )
	{
		$type .= " NOT NULL" . $default;
	}

	return $type;
}

=pod

=back

=head2 Basic SQL Operations

=cut

######################################################################
=pod

=over 4

=item $success = $db->do( $sql )

Execute the given C<$sql>.

Returns 1 on success and C<undef> on failure. If the failure is one that
C<retry_error> reports as retryable, up to 10 reconnect attempts are made,
3 seconds apart, before giving up.

=cut
######################################################################

sub do
{
	my( $self , $sql ) = @_;

	# give the repository a chance to rewrite the statement
	if( $self->{session}->get_repository->can_call( 'sql_adjust' ) )
	{
		$sql = $self->{session}->get_repository->call( 'sql_adjust', $sql );
	}

	if( $self->{debug} )
	{
		use Time::HiRes;
		$self->{session}->get_repository->log( "Database execute debug (" . Time::HiRes::time() . "): $sql" );
	}

	my $result = $self->{dbh}->do( $sql );

	if( !$result )
	{
		$self->{session}->get_repository->log( "SQL ERROR (do): $sql" );
		$self->{session}->get_repository->log( "SQL ERROR (do): ".$self->{dbh}->errstr.' (#'.$self->{dbh}->err.')' );

		# only errors flagged as retryable are worth a reconnect
		return undef unless( $self->retry_error() );

		my $ccount = 0;
		while( $ccount < 10 )
		{
			++$ccount;
			sleep 3;
			$self->{session}->get_repository->log( "Attempting DB reconnect: $ccount" );
			$self->connect;
			if( defined $self->{dbh} )
			{
				$result = $self->{dbh}->do( $sql );
				return 1 if( defined $result );
				$self->{session}->get_repository->log( "SQL ERROR (do): ".$self->{dbh}->errstr );
			}
		}
		$self->{session}->get_repository->log( "Giving up after 10 tries" );
		return undef;
	}

	if( defined $result )
	{
		return 1;
	}

	return undef;
}

######################################################################
=pod

=item $sth = $db->prepare( $sql )

Prepare the given C<$sql> and return a handle on it.

Use the C<execute> method on the returned L<DBI> handle to execute the SQL:

	my $sth = $db->prepare_select( "SELECT 'Hello, World'" );

	$sth->execute;

If the statement cannot be prepared the error is logged and the process
aborts with the database error message. Errors that C<retry_error> reports
as retryable first get up to 10 reconnect attempts, 3 seconds apart.

=cut
######################################################################

sub prepare
{
	my ( $self , $sql ) = @_;

	# give the repository a chance to rewrite the statement
	if( $self->{session}->get_repository->can_call( 'sql_adjust' ) )
	{
		$sql = $self->{session}->get_repository->call( 'sql_adjust', $sql );
	}

#	if( $self->{debug} )
#	{
#		$self->{session}->get_repository->log( "Database prepare debug: $sql" );
#	}

	my $result = $self->{dbh}->prepare( $sql );

	if( !$result )
	{
		$self->{session}->get_repository->log( "SQL ERROR (prepare): $sql" );
		$self->{session}->get_repository->log( "SQL ERROR (prepare): ".$self->{dbh}->errstr.' (#'.$self->{dbh}->err.')' );

		# DB disconnect?
		unless( $self->retry_error() )
		{
			# errstr is a method on the handle, not a hash entry
			EPrints::abort( $self->{dbh}->errstr );
		}

		my $ccount = 0;
		while( $ccount < 10 )
		{
			++$ccount;
			sleep 3;
			$self->{session}->get_repository->log( "Attempting DB reconnect: $ccount" );
			$self->connect;
			if( defined $self->{dbh} )
			{
				$result = $self->{dbh}->prepare( $sql );
				return $result if( defined $result );
				$self->{session}->get_repository->log( "SQL ERROR (prepare): ".$self->{dbh}->errstr );
			}
		}
		$self->{session}->get_repository->log( "Giving up after 10 tries" );

		# The last reconnect may have left no handle at all, in which
		# case only DBI's package-level error string is available.
		my $errstr = defined $self->{dbh} ? $self->{dbh}->errstr : $DBI::errstr;
		EPrints::abort( defined $errstr ? $errstr : "SQL ERROR (prepare): $sql" );
	}

	return $result;
}

######################################################################
=pod

=item $sth = $db->prepare_select( $sql, [ %options ] )

Prepare a C