2005-05-21 10:15:39 +00:00
|
|
|
<?php
|
2005-08-14 07:18:34 +00:00
|
|
|
|
2005-09-16 12:00:23 +00:00
|
|
|
// Bind both registries to the global scope in one statement, so the
// assignments below reach the real globals even if this file is included
// from inside a function.
global $wgExternalLoadBalancers, $wgExternalBlobCache;

/**
 * Associative array of LoadBalancer objects, indexed by cluster name.
 *
 * External database storage uses one (or more) connection pools that are
 * separate from the ones the main wiki uses. When many revisions are loaded,
 * for instance during bulk backups or maintenance, these are meant to stay
 * around for the lifetime of the script.
 */
$wgExternalLoadBalancers = array();

/**
 * One-step cache variable holding base blobs.
 *
 * Operations that pull multiple revisions often pull several times from the
 * same blob; keeping the last-used one open avoids redundant unserialization
 * and decompression overhead.
 */
$wgExternalBlobCache = array();
|
|
|
|
|
|
WARNING: HUGE COMMIT
Doxygen documentation update:
* Changed all @addtogroup to @ingroup. @addtogroup adds the comment to the group description, but doesn't add the file, class, function, ... to the group like @ingroup does. See for example http://svn.wikimedia.org/doc/group__SpecialPage.html where it's impossible to see related files, classes, ... that should belong to that group.
* Added @file to file descriptions; it seems that it should be explicitly declared for file descriptions, otherwise doxygen will think that the comment documents the first class, variable, function, ... that is in that file.
* Removed some empty comments
* Removed some ?>
Added following groups:
* ExternalStorage
* JobQueue
* MaintenanceLanguage
One more thing: there are still a lot of warnings when generating the doc.
2008-05-20 17:13:28 +00:00
|
|
|
/**
 * DB accessible external objects.
 *
 * Stores text blobs in a per-cluster "blobs" table and retrieves them through
 * URLs of the form DB://cluster/id or DB://cluster/id/itemid.
 *
 * @ingroup ExternalStorage
 */
class ExternalStoreDB {

	/**
	 * Parameters given to the constructor. The optional 'wiki' entry is
	 * forwarded to the load balancer factory and to getConnection().
	 * Declared explicitly so it is not created as a dynamic property.
	 */
	public $mParams = array();

	/**
	 * @param $params Array: store parameters; only 'wiki' is read by this class
	 */
	public function __construct( $params = array() ) {
		$this->mParams = $params;
	}

	/**
	 * Get the 'wiki' parameter this store was constructed with.
	 *
	 * @return mixed the 'wiki' parameter, or false when it was not supplied
	 */
	protected function getWikiParam() {
		return isset( $this->mParams['wiki'] ) ? $this->mParams['wiki'] : false;
	}

	/**
	 * Get a LoadBalancer for the specified cluster
	 *
	 * @param $cluster String: cluster name
	 * @return LoadBalancer object
	 */
	public function &getLoadBalancer( $cluster ) {
		// This method returns by reference, so the result has to live in a
		// variable: returning the call expression directly triggers
		// "Only variable references should be returned by reference".
		$lb = wfGetLBFactory()->getExternalLB( $cluster, $this->getWikiParam() );
		return $lb;
	}

	/**
	 * Get a slave database connection for the specified cluster
	 *
	 * @param $cluster String: cluster name
	 * @return DatabaseBase object
	 */
	public function &getSlave( $cluster ) {
		$lb = $this->getLoadBalancer( $cluster );
		// Kept in a local for the same return-by-reference reason as above.
		$conn = $lb->getConnection( DB_SLAVE, array(), $this->getWikiParam() );
		return $conn;
	}

	/**
	 * Get a master database connection for the specified cluster
	 *
	 * @param $cluster String: cluster name
	 * @return DatabaseBase object
	 */
	public function &getMaster( $cluster ) {
		$lb = $this->getLoadBalancer( $cluster );
		// Kept in a local for the same return-by-reference reason as above.
		$conn = $lb->getConnection( DB_MASTER, array(), $this->getWikiParam() );
		return $conn;
	}

	/**
	 * Get the 'blobs' table name for this database
	 *
	 * @param $db DatabaseBase
	 * @return String: table name ('blobs' by default)
	 */
	public function getTable( &$db ) {
		$table = $db->getLBInfo( 'blobs table' );
		// No per-connection override configured: use the default name.
		return is_null( $table ) ? 'blobs' : $table;
	}

	/**
	 * Fetch data from given URL
	 *
	 * @param $url String: a URL of the form DB://cluster/id or
	 *   DB://cluster/id/itemid for concatenated storage.
	 * @return mixed the blob text, or the requested item of a multi-item
	 *   blob; false when the URL is malformed or the blob cannot be loaded
	 */
	public function fetchFromURL( $url ) {
		// "DB://cluster/id[/itemid]" splits into
		// array( 'DB:', '', cluster, id [, itemid] ).
		$path = explode( '/', $url );
		if ( !isset( $path[3] ) || $path[2] === '' || $path[3] === '' ) {
			// Without this guard a malformed URL produced undefined-offset
			// notices and a lookup with a null cluster/id.
			wfDebugLog( 'ExternalStoreDB', __METHOD__ . ": malformed URL $url\n" );
			return false;
		}

		$cluster = $path[2];
		$id = $path[3];
		$itemID = isset( $path[4] ) ? $path[4] : false;

		$ret =& $this->fetchBlob( $cluster, $id, $itemID );

		if ( $itemID !== false && $ret !== false ) {
			return $ret->getItem( $itemID );
		}
		return $ret;
	}

	/**
	 * Fetch a blob item out of the database; a cache of the last-loaded
	 * blob will be kept so that multiple loads out of a multi-item blob
	 * can avoid redundant database access and decompression.
	 *
	 * @param $cluster String: cluster name
	 * @param $id String: value matched against blob_id
	 * @param $itemID Mixed: item name inside a multi-item blob, or false
	 *   when the raw blob text is wanted
	 * @return mixed raw blob text when $itemID is false, the unserialized
	 *   blob object otherwise, or false on failure
	 * @private
	 */
	public function &fetchBlob( $cluster, $id, $itemID ) {
		global $wgExternalBlobCache;

		// The trailing slash keeps the unserialized form of a blob apart from
		// its raw text in the cache.
		$cacheID = ( $itemID === false ) ? "$cluster/$id" : "$cluster/$id/";
		if ( isset( $wgExternalBlobCache[$cacheID] ) ) {
			wfDebug( "ExternalStoreDB::fetchBlob cache hit on $cacheID\n" );
			return $wgExternalBlobCache[$cacheID];
		}

		wfDebug( "ExternalStoreDB::fetchBlob cache miss on $cacheID\n" );

		$dbr =& $this->getSlave( $cluster );
		$ret = $dbr->selectField( $this->getTable( $dbr ), 'blob_text', array( 'blob_id' => $id ) );
		if ( $ret === false ) {
			wfDebugLog( 'ExternalStoreDB', "ExternalStoreDB::fetchBlob master fallback on $cacheID\n" );
			// Try the master
			$dbw =& $this->getMaster( $cluster );
			$ret = $dbw->selectField( $this->getTable( $dbw ), 'blob_text', array( 'blob_id' => $id ) );
			if ( $ret === false ) {
				wfDebugLog( 'ExternalStoreDB', "ExternalStoreDB::fetchBlob master failed to find $cacheID\n" );
			}
		}

		if ( $itemID !== false && $ret !== false ) {
			// Unserialise object; caller extracts item.
			// NOTE(review): unserialize() runs on whatever is stored in
			// blob_text; this assumes the external store only holds trusted data.
			$ret = unserialize( $ret );
			if ( !is_object( $ret ) ) {
				// The caller invokes getItem() on the result, so anything
				// that is not an object is reported as a failed fetch.
				wfDebugLog( 'ExternalStoreDB', __METHOD__ . ": $cacheID did not unserialize to an object\n" );
				$ret = false;
			}
		}

		// Single-entry cache: only the most recently loaded blob is retained.
		$wgExternalBlobCache = array( $cacheID => &$ret );
		return $ret;
	}

	/**
	 * Insert a data item into a given cluster
	 *
	 * @param $cluster String: the cluster name
	 * @param $data String: the data item
	 * @return string URL
	 * @throws MWException when the database reports no insert ID
	 */
	public function store( $cluster, $data ) {
		$dbw = $this->getMaster( $cluster );
		$id = $dbw->nextSequenceValue( 'blob_blob_id_seq' );
		$dbw->insert(
			$this->getTable( $dbw ),
			array( 'blob_id' => $id, 'blob_text' => $data ),
			__METHOD__
		);

		// The ID reported by the database after the insert is the one that
		// goes into the returned URL.
		$id = $dbw->insertId();
		if ( !$id ) {
			throw new MWException( __METHOD__ . ': no insert ID' );
		}

		// When the connection has DBO_TRX set, commit right away.
		if ( $dbw->getFlag( DBO_TRX ) ) {
			$dbw->commit();
		}
		return "DB://$cluster/$id";
	}
}
|