wiki.techinc.nl/includes/db/MWLBFactory.php
daniel aa7fada9dc Avoid errors in CLI mode when user has no name
MWLBFactory tries to determine the current user's name using
posix_getpwuid(). This will however fail if the current user has no
name, which is the case when running in our standard docker environment.

Bug: T283191
Change-Id: If814d791ee7061d8632ae04602cf489b06422eee
2021-05-19 17:46:49 +00:00

454 lines
16 KiB
PHP

<?php
/**
* Generator of database load balancing objects.
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License along
* with this program; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
* http://www.gnu.org/copyleft/gpl.html
*
* @file
* @ingroup Database
*/
use MediaWiki\Config\ServiceOptions;
use MediaWiki\Logger\LoggerFactory;
use Wikimedia\Rdbms\ChronologyProtector;
use Wikimedia\Rdbms\DatabaseDomain;
use Wikimedia\Rdbms\IDatabase;
use Wikimedia\Rdbms\ILBFactory;
use Wikimedia\Rdbms\LBFactory;
use Wikimedia\RequestTimeout\CriticalSectionProvider;
/**
* MediaWiki-specific class for generating database load balancers
*
* @internal For use by core ServiceWiring only.
* @ingroup Database
*/
abstract class MWLBFactory {
/** @var array Cache of already-logged deprecation messages */
private static $loggedDeprecations = [];
/**
* @internal For use by ServiceWiring
*/
public const APPLY_DEFAULT_CONFIG_OPTIONS = [
'DBcompress',
'DBDefaultGroup',
'DBmwschema',
'DBname',
'DBpassword',
'DBport',
'DBprefix',
'DBserver',
'DBservers',
'DBssl',
'DBtype',
'DBuser',
'DebugDumpSql',
'DebugLogFile',
'DebugToolbar',
'ExternalServers',
'SQLiteDataDir',
'SQLMode',
];
/**
* @param array $lbConf Config for LBFactory::__construct()
* @param ServiceOptions $options
* @param ConfiguredReadOnlyMode $readOnlyMode
* @param BagOStuff $cpStash
* @param BagOStuff $srvCache
* @param WANObjectCache $wanCache
* @param CriticalSectionProvider $csProvider
* @return array
* @internal For use with service wiring
*/
public static function applyDefaultConfig(
array $lbConf,
ServiceOptions $options,
ConfiguredReadOnlyMode $readOnlyMode,
BagOStuff $cpStash,
BagOStuff $srvCache,
WANObjectCache $wanCache,
CriticalSectionProvider $csProvider
) {
$options->assertRequiredOptions( self::APPLY_DEFAULT_CONFIG_OPTIONS );
global $wgCommandLineMode;
$typesWithSchema = self::getDbTypesWithSchemas();
$lbConf += [
'localDomain' => new DatabaseDomain(
$options->get( 'DBname' ),
$options->get( 'DBmwschema' ),
$options->get( 'DBprefix' )
),
'profiler' => static function ( $section ) {
return Profiler::instance()->scopedProfileIn( $section );
},
'trxProfiler' => Profiler::instance()->getTransactionProfiler(),
'replLogger' => LoggerFactory::getInstance( 'DBReplication' ),
'queryLogger' => LoggerFactory::getInstance( 'DBQuery' ),
'connLogger' => LoggerFactory::getInstance( 'DBConnection' ),
'perfLogger' => LoggerFactory::getInstance( 'DBPerformance' ),
'errorLogger' => [ MWExceptionHandler::class, 'logException' ],
'deprecationLogger' => [ static::class, 'logDeprecation' ],
'cliMode' => $wgCommandLineMode,
'readOnlyReason' => $readOnlyMode->getReason(),
'defaultGroup' => $options->get( 'DBDefaultGroup' ),
'criticalSectionProvider' => $csProvider
];
$serversCheck = [];
// When making changes here, remember to also specify MediaWiki-specific options
// for Database classes in the relevant Installer subclass.
// Such as MysqlInstaller::openConnection and PostgresInstaller::openConnectionWithParams.
if ( $lbConf['class'] === Wikimedia\Rdbms\LBFactorySimple::class ) {
if ( isset( $lbConf['servers'] ) ) {
// Server array is already explicitly configured
} elseif ( is_array( $options->get( 'DBservers' ) ) ) {
$lbConf['servers'] = [];
foreach ( $options->get( 'DBservers' ) as $i => $server ) {
$lbConf['servers'][$i] = self::initServerInfo( $server, $options );
}
} else {
$server = self::initServerInfo(
[
'host' => $options->get( 'DBserver' ),
'user' => $options->get( 'DBuser' ),
'password' => $options->get( 'DBpassword' ),
'dbname' => $options->get( 'DBname' ),
'type' => $options->get( 'DBtype' ),
'load' => 1
],
$options
);
$server['flags'] |= $options->get( 'DBssl' ) ? DBO_SSL : 0;
$server['flags'] |= $options->get( 'DBcompress' ) ? DBO_COMPRESS : 0;
$lbConf['servers'] = [ $server ];
}
if ( !isset( $lbConf['externalClusters'] ) ) {
$lbConf['externalClusters'] = $options->get( 'ExternalServers' );
}
$serversCheck = $lbConf['servers'];
} elseif ( $lbConf['class'] === Wikimedia\Rdbms\LBFactoryMulti::class ) {
if ( isset( $lbConf['serverTemplate'] ) ) {
if ( in_array( $lbConf['serverTemplate']['type'], $typesWithSchema, true ) ) {
$lbConf['serverTemplate']['schema'] = $options->get( 'DBmwschema' );
}
$lbConf['serverTemplate']['sqlMode'] = $options->get( 'SQLMode' );
$serversCheck = [ $lbConf['serverTemplate'] ];
}
}
self::assertValidServerConfigs(
$serversCheck,
$options->get( 'DBname' ),
$options->get( 'DBprefix' )
);
$lbConf['cpStash'] = $cpStash;
$lbConf['srvCache'] = $srvCache;
$lbConf['wanCache'] = $wanCache;
return $lbConf;
}
/**
* @return array
*/
private static function getDbTypesWithSchemas() {
return [ 'postgres' ];
}
/**
* @param array $server
* @param ServiceOptions $options
* @return array
*/
private static function initServerInfo( array $server, ServiceOptions $options ) {
if ( $server['type'] === 'sqlite' ) {
$httpMethod = $_SERVER['REQUEST_METHOD'] ?? null;
// T93097: hint for how file-based databases (e.g. sqlite) should go about locking.
// See https://www.sqlite.org/lang_transaction.html
// See https://www.sqlite.org/lockingv3.html#shared_lock
$isHttpRead = in_array( $httpMethod, [ 'GET', 'HEAD', 'OPTIONS', 'TRACE' ] );
if ( MW_ENTRY_POINT === 'rest' && !$isHttpRead ) {
// Hack to support some re-entrant invocations using sqlite
// See: T259685, T91820
$request = \MediaWiki\Rest\EntryPoint::getMainRequest();
if ( $request->hasHeader( 'Promise-Non-Write-API-Action' ) ) {
$isHttpRead = true;
}
}
$server += [
'dbDirectory' => $options->get( 'SQLiteDataDir' ),
'trxMode' => $isHttpRead ? 'DEFERRED' : 'IMMEDIATE'
];
} elseif ( $server['type'] === 'postgres' ) {
$server += [ 'port' => $options->get( 'DBport' ) ];
}
if ( in_array( $server['type'], self::getDbTypesWithSchemas(), true ) ) {
$server += [ 'schema' => $options->get( 'DBmwschema' ) ];
}
$flags = $server['flags'] ?? DBO_DEFAULT;
if ( $options->get( 'DebugDumpSql' )
|| $options->get( 'DebugLogFile' )
|| $options->get( 'DebugToolbar' )
) {
$flags |= DBO_DEBUG;
}
$server['flags'] = $flags;
$server += [
'tablePrefix' => $options->get( 'DBprefix' ),
'sqlMode' => $options->get( 'SQLMode' ),
];
return $server;
}
/**
* @param array $servers
* @param string $ldDB Local domain database name
* @param string $ldTP Local domain prefix
*/
private static function assertValidServerConfigs( array $servers, $ldDB, $ldTP ) {
foreach ( $servers as $server ) {
$type = $server['type'] ?? null;
$srvDB = $server['dbname'] ?? null; // server DB
$srvTP = $server['tablePrefix'] ?? ''; // server table prefix
if ( $type === 'mysql' ) {
// A DB name is not needed to connect to mysql; 'dbname' is useless.
// This field only defines the DB to use for unspecified DB domains.
if ( $srvDB !== null && $srvDB !== $ldDB ) {
self::reportMismatchedDBs( $srvDB, $ldDB );
}
} elseif ( $type === 'postgres' ) {
if ( $srvTP !== '' ) {
self::reportIfPrefixSet( $srvTP, $type );
}
}
if ( $srvTP !== '' && $srvTP !== $ldTP ) {
self::reportMismatchedPrefixes( $srvTP, $ldTP );
}
}
}
/**
* @param string $prefix Table prefix
* @param string $dbType Database type
*/
private static function reportIfPrefixSet( $prefix, $dbType ) {
$e = new UnexpectedValueException(
"\$wgDBprefix is set to '$prefix' but the database type is '$dbType'. " .
"MediaWiki does not support using a table prefix with this RDBMS type."
);
MWExceptionRenderer::output( $e, MWExceptionRenderer::AS_PRETTY );
exit;
}
/**
* @param string $srvDB Server config database
* @param string $ldDB Local DB domain database
*/
private static function reportMismatchedDBs( $srvDB, $ldDB ) {
$e = new UnexpectedValueException(
"\$wgDBservers has dbname='$srvDB' but \$wgDBname='$ldDB'. " .
"Set \$wgDBname to the database used by this wiki project. " .
"There is rarely a need to set 'dbname' in \$wgDBservers. " .
"Cross-wiki database access, use of WikiMap::getCurrentWikiDbDomain(), " .
"use of Database::getDomainId(), and other features are not reliable when " .
"\$wgDBservers does not match the local wiki database/prefix."
);
MWExceptionRenderer::output( $e, MWExceptionRenderer::AS_PRETTY );
exit;
}
/**
* @param string $srvTP Server config table prefix
* @param string $ldTP Local DB domain database
*/
private static function reportMismatchedPrefixes( $srvTP, $ldTP ) {
$e = new UnexpectedValueException(
"\$wgDBservers has tablePrefix='$srvTP' but \$wgDBprefix='$ldTP'. " .
"Set \$wgDBprefix to the table prefix used by this wiki project. " .
"There is rarely a need to set 'tablePrefix' in \$wgDBservers. " .
"Cross-wiki database access, use of WikiMap::getCurrentWikiDbDomain(), " .
"use of Database::getDomainId(), and other features are not reliable when " .
"\$wgDBservers does not match the local wiki database/prefix."
);
MWExceptionRenderer::output( $e, MWExceptionRenderer::AS_PRETTY );
exit;
}
/**
* Decide which LBFactory class to use.
*
* @internal For use by ServiceWiring
* @param array $config (e.g. $wgLBFactoryConf)
* @return string Class name
*/
public static function getLBFactoryClass( array $config ) {
$compat = [
// For LocalSettings.php compat after removing underscores (since 1.23).
'LBFactory_Single' => Wikimedia\Rdbms\LBFactorySingle::class,
'LBFactory_Simple' => Wikimedia\Rdbms\LBFactorySimple::class,
'LBFactory_Multi' => Wikimedia\Rdbms\LBFactoryMulti::class,
// For LocalSettings.php compat after moving classes to namespaces (since 1.29).
'LBFactorySingle' => Wikimedia\Rdbms\LBFactorySingle::class,
'LBFactorySimple' => Wikimedia\Rdbms\LBFactorySimple::class,
'LBFactoryMulti' => Wikimedia\Rdbms\LBFactoryMulti::class
];
$class = $config['class'];
return $compat[$class] ?? $class;
}
/**
* @param ILBFactory $lbFactory
*/
public static function setDomainAliases( ILBFactory $lbFactory ) {
$domain = DatabaseDomain::newFromId( $lbFactory->getLocalDomainID() );
// For compatibility with hyphenated $wgDBname values on older wikis, handle callers
// that assume corresponding database domain IDs and wiki IDs have identical values
$rawLocalDomain = strlen( $domain->getTablePrefix() )
? "{$domain->getDatabase()}-{$domain->getTablePrefix()}"
: (string)$domain->getDatabase();
$lbFactory->setDomainAliases( [ $rawLocalDomain => $domain ] );
}
/**
* Apply global state from the current web request or other PHP process.
*
* This technically violates the principle constraint on ServiceWiring to be
* deterministic for a given site configuration. The exemption made here
* is solely to aid in debugging and influence non-nominal behaviour such
* as ChronologyProtector. That is, the state applied here must never change
* the logical destination or meaning of any database-related methods, it
* merely applies preferences and debugging information.
*
* The code here must be non-essential, with LBFactory behaving the same toward
* its consumers regardless of whether this is applied or not.
*
* For example, something may instantiate LBFactory for the current wiki without
* calling this, and its consumers must not be able to tell the difference.
* Likewise, in the future MediaWiki may instantiate service wiring and LBFactory
* for a foreign wiki in the same farm and apply the current global state to that,
* and that should be fine as well.
*
* @param ILBFactory $lbFactory
* @param Config $config
* @param IBufferingStatsdDataFactory $stats
*/
public static function applyGlobalState(
ILBFactory $lbFactory,
Config $config,
IBufferingStatsdDataFactory $stats
) : void {
// Use the global WebRequest singleton. The main reason for using this
// is to call WebRequest::getIP() which is non-trivial to reproduce statically
// because it needs $wgUsePrivateIPs, as well as ProxyLookup and HookRunner services.
// TODO: Create a static version of WebRequest::getIP that accepts these three
// as dependencies, and then call that here. The other uses of $req below can
// trivially use $_COOKIES, $_GET and $_SERVER instead.
$req = RequestContext::getMain()->getRequest();
// Set user IP/agent information for agent session consistency purposes
$reqStart = (int)( $_SERVER['REQUEST_TIME_FLOAT'] ?? time() );
$cpPosInfo = LBFactory::getCPInfoFromCookieValue(
// The cookie has no prefix and is set by MediaWiki::preOutputCommit()
$req->getCookie( 'cpPosIndex', '' ),
// Mitigate broken client-side cookie expiration handling (T190082)
$reqStart - ChronologyProtector::POSITION_COOKIE_TTL
);
$lbFactory->setRequestInfo( [
'IPAddress' => $req->getIP(),
'UserAgent' => $req->getHeader( 'User-Agent' ),
'ChronologyProtection' => $req->getHeader( 'MediaWiki-Chronology-Protection' ),
'ChronologyPositionIndex' => $req->getInt( 'cpPosIndex', $cpPosInfo['index'] ),
'ChronologyClientId' => $cpPosInfo['clientId']
?? $req->getHeader( 'MediaWiki-Chronology-Client-Id' )
] );
if ( $config->get( 'CommandLineMode' ) ) {
// Add a comment for easy SHOW PROCESSLIST interpretation
// TODO: For web requests this is still handled eagerly in MediaWiki.php.
if ( function_exists( 'posix_getpwuid' ) ) {
$uid = posix_geteuid();
// NOTE: posix_getpwuid will return false if the current user has no name,
// which is common when running inside a Docker container.
$pwuid = posix_getpwuid( $uid );
$agent = $pwuid['name'] ?? "uid:$uid";
} else {
$agent = 'sysadmin';
}
$agent .= '@' . wfHostname();
$lbFactory->setAgentName(
mb_strlen( $agent ) > 15 ? mb_substr( $agent, 0, 15 ) . '...' : $agent
);
// Disable buffering and delaying of DeferredUpdates and stats
// for maintenance scripts and PHPUnit tests.
// Hook into period lag checks which often happen in long-running scripts
$lbFactory->setWaitForReplicationListener(
__METHOD__,
static function () use ( $stats, $config ) {
DeferredUpdates::tryOpportunisticExecute( 'run' );
// Try to periodically flush buffered metrics to avoid OOMs
MediaWiki::emitBufferedStatsdData( $stats, $config );
}
);
// Check for other windows to run them. A script may read or do a few writes
// to the master but mostly be writing to something else, like a file store.
$lbFactory->getMainLB()->setTransactionListener(
__METHOD__,
static function ( $trigger ) use ( $stats, $config ) {
if ( $trigger === IDatabase::TRIGGER_COMMIT ) {
DeferredUpdates::tryOpportunisticExecute( 'run' );
}
// Try to periodically flush buffered metrics to avoid OOMs
MediaWiki::emitBufferedStatsdData( $stats, $config );
}
);
}
}
/**
* Log a database deprecation warning
*
* @param string $msg Deprecation message
*/
public static function logDeprecation( $msg ) {
if ( isset( self::$loggedDeprecations[$msg] ) ) {
return;
}
self::$loggedDeprecations[$msg] = true;
MWDebug::sendRawDeprecated( $msg, true, wfGetCaller() );
}
}