This can be used by WANObjectCache or statsd metrics to estimate the size of objects and network commands without having to do an extra serialization round. Change-Id: I7b1b787bba39a21e2e04262e77ee7ae24e88f8ca
568 lines
20 KiB
PHP
568 lines
20 KiB
PHP
<?php
|
|
/**
 * Copyright © 2003-2004 Brion Vibber <brion@pobox.com>
 * https://www.mediawiki.org/
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @file
 * @ingroup Cache
 */
|
|
|
|
/**
 * @defgroup Cache Cache
 */
|
|
|
|
use Psr\Log\LoggerAwareInterface;
|
|
use Psr\Log\LoggerInterface;
|
|
use Psr\Log\NullLogger;
|
|
use Wikimedia\LightweightObjectStore\ExpirationAwareness;
|
|
use Wikimedia\LightweightObjectStore\StorageAwareness;
|
|
use Wikimedia\ScopedCallback;
|
|
|
|
/**
 * Class representing a cache/ephemeral data store
 *
 * This interface is intended to be more or less compatible with the PHP memcached client.
 *
 * Instances of this class should be created with an intended access scope, such as:
 *   - a) A single PHP thread on a server (e.g. stored in a PHP variable)
 *   - b) A single application server (e.g. stored in APC or sqlite)
 *   - c) All application servers in datacenter (e.g. stored in memcached or mysql)
 *   - d) All application servers in all datacenters (e.g. stored via mcrouter or dynomite)
 *
 * Callers should use the proper factory methods that yield BagOStuff instances. Site admins
 * should make sure the configuration for those factory methods matches their access scope.
 * BagOStuff subclasses have widely varying levels of support for replication features.
 *
 * For any given instance, methods like lock(), unlock(), merge(), and set() with WRITE_SYNC
 * should semantically operate over its entire access scope; any nodes/threads in that scope
 * should serialize appropriately when using them. Likewise, a call to get() with READ_LATEST
 * from one node in its access scope should reflect the prior changes of any other node in its
 * access scope. Any get() should reflect the changes of any prior set() with WRITE_SYNC.
 *
 * Subclasses should override the default "segmentationSize" field with an appropriate value.
 * The value should not be larger than what the storage backend (by default) supports. It also
 * should be roughly informed by common performance bottlenecks (e.g. values over a certain size
 * having poor scalability). The same goes for the "segmentedValueMaxSize" member, which limits
 * the maximum size and chunk count (indirectly) of values.
 *
 * @ingroup Cache
 */
abstract class BagOStuff implements
	ExpirationAwareness,
	StorageAwareness,
	IStoreKeyEncoder,
	LoggerAwareInterface
{
	/** @var LoggerInterface */
	protected $logger;

	/** @var callable|null */
	protected $asyncHandler;
	/** @var int[] Map of (ATTR_* class constant => QOS_* class constant) */
	protected $attrMap = [];

	/** @var bool */
	protected $debugMode = false;

	/** @var float|null */
	private $wallClockOverride;

	/** Bitfield constants for get()/getMulti(); these are only advisory */
	const READ_LATEST = 1; // if supported, avoid reading stale data due to replication
	const READ_VERIFIED = 2; // promise that the caller handles detection of staleness
	/** Bitfield constants for set()/merge(); these are only advisory */
	const WRITE_SYNC = 4; // if supported, block until the write is fully replicated
	const WRITE_CACHE_ONLY = 8; // only change state of the in-memory cache
	const WRITE_ALLOW_SEGMENTS = 16; // allow partitioning of the value if it is large
	const WRITE_PRUNE_SEGMENTS = 32; // delete all the segments if the value is partitioned
	const WRITE_BACKGROUND = 64; // if supported, do not block on completion until the next read

	/**
	 * Parameters include:
	 *   - logger: Psr\Log\LoggerInterface instance
	 *   - asyncHandler: Callable to use for scheduling tasks after the web request ends.
	 *      In CLI mode, it should run the task immediately.
	 * @param array $params
	 * @phan-param array{logger?:Psr\Log\LoggerInterface,asyncHandler?:callable} $params
	 */
	public function __construct( array $params = [] ) {
		// Fall back to a NullLogger so that $this->logger is always usable
		$this->setLogger( $params['logger'] ?? new NullLogger() );
		$this->asyncHandler = $params['asyncHandler'] ?? null;
	}

	/**
	 * @param LoggerInterface $logger
	 * @return void
	 */
	public function setLogger( LoggerInterface $logger ) {
		$this->logger = $logger;
	}

	/**
	 * @since 1.35
	 * @return LoggerInterface
	 */
	public function getLogger() : LoggerInterface {
		return $this->logger;
	}

	/**
	 * Set the debug mode flag of this instance
	 *
	 * @param bool $enabled
	 */
	public function setDebug( $enabled ) {
		$this->debugMode = $enabled;
	}

	/**
	 * Get an item with the given key, regenerating and setting it if not found
	 *
	 * The callback can take $exptime as argument by reference and modify it.
	 * Nothing is stored nor deleted if the callback returns false.
	 *
	 * @param string $key
	 * @param int $exptime Time-to-live (seconds)
	 * @param callable $callback Callback that derives the new value
	 * @param int $flags Bitfield of BagOStuff::READ_* or BagOStuff::WRITE_* constants [optional]
	 * @return mixed The cached value if found or the result of $callback otherwise
	 * @since 1.27
	 */
	final public function getWithSetCallback( $key, $exptime, $callback, $flags = 0 ) {
		$value = $this->get( $key, $flags );

		if ( $value === false ) {
			// Cache miss (or read failure); regenerate the value
			$value = $callback( $exptime );
			// Only store usable values; the callback may have set a negative TTL to veto caching
			if ( $value !== false && $exptime >= 0 ) {
				$this->set( $key, $value, $exptime, $flags );
			}
		}

		return $value;
	}

	/**
	 * Get an item with the given key
	 *
	 * If the key includes a deterministic input hash (e.g. the key can only have
	 * the correct value) or complete staleness checks are handled by the caller
	 * (e.g. nothing relies on the TTL), then the READ_VERIFIED flag should be set.
	 * This lets tiered backends know they can safely upgrade a cached value to
	 * higher tiers using standard TTLs.
	 *
	 * @param string $key
	 * @param int $flags Bitfield of BagOStuff::READ_* constants [optional]
	 * @return mixed Returns false on failure or if the item does not exist
	 */
	abstract public function get( $key, $flags = 0 );

	/**
	 * Set an item
	 *
	 * @param string $key
	 * @param mixed $value
	 * @param int $exptime Either an interval in seconds or a unix timestamp for expiry
	 * @param int $flags Bitfield of BagOStuff::WRITE_* constants
	 * @return bool Success
	 */
	abstract public function set( $key, $value, $exptime = 0, $flags = 0 );

	/**
	 * Delete an item
	 *
	 * For large values written using WRITE_ALLOW_SEGMENTS, this only deletes the main
	 * segment list key unless WRITE_PRUNE_SEGMENTS is in the flags. While deleting the segment
	 * list key has the effect of functionally deleting the key, it leaves unused blobs in cache.
	 *
	 * @param string $key
	 * @param int $flags Bitfield of BagOStuff::WRITE_* constants
	 * @return bool True if the item was deleted or not found, false on failure
	 */
	abstract public function delete( $key, $flags = 0 );

	/**
	 * Insert an item if it does not already exist
	 *
	 * @param string $key
	 * @param mixed $value
	 * @param int $exptime
	 * @param int $flags Bitfield of BagOStuff::WRITE_* constants (since 1.33)
	 * @return bool Success
	 */
	abstract public function add( $key, $value, $exptime = 0, $flags = 0 );

	/**
	 * Merge changes into the existing cache value (possibly creating a new one)
	 *
	 * The callback function returns the new value given the current value
	 * (which will be false if not present), and takes the arguments:
	 * (this BagOStuff, cache key, current value, TTL).
	 * The TTL parameter is reference set to $exptime. It can be overridden in the callback.
	 * Nothing is stored nor deleted if the callback returns false.
	 *
	 * @param string $key
	 * @param callable $callback Callback method to be executed
	 * @param int $exptime Either an interval in seconds or a unix timestamp for expiry
	 * @param int $attempts The amount of times to attempt a merge in case of failure
	 * @param int $flags Bitfield of BagOStuff::WRITE_* constants
	 * @return bool Success
	 * @throws InvalidArgumentException
	 */
	abstract public function merge(
		$key,
		callable $callback,
		$exptime = 0,
		$attempts = 10,
		$flags = 0
	);

	/**
	 * Change the expiration on a key if it exists
	 *
	 * If an expiry in the past is given then the key will immediately be expired
	 *
	 * For large values written using WRITE_ALLOW_SEGMENTS, this only changes the TTL of the
	 * main segment list key. While lowering the TTL of the segment list key has the effect of
	 * functionally lowering the TTL of the key, it might leave unused blobs in cache for longer.
	 * Raising the TTL of such keys is not effective, since the expiration of a single segment
	 * key effectively expires the entire value.
	 *
	 * @param string $key
	 * @param int $exptime TTL or UNIX timestamp
	 * @param int $flags Bitfield of BagOStuff::WRITE_* constants (since 1.33)
	 * @return bool Success Returns false on failure or if the item does not exist
	 * @since 1.28
	 */
	abstract public function changeTTL( $key, $exptime = 0, $flags = 0 );

	/**
	 * Acquire an advisory lock on a key string
	 *
	 * Note that if reentry is enabled, duplicate calls ignore $expiry
	 *
	 * @param string $key
	 * @param int $timeout Lock wait timeout; 0 for non-blocking [optional]
	 * @param int $expiry Lock expiry [optional]; 1 day maximum
	 * @param string $rclass Allow reentry if set and the current lock used this value
	 * @return bool Success
	 */
	abstract public function lock( $key, $timeout = 6, $expiry = 6, $rclass = '' );

	/**
	 * Release an advisory lock on a key string
	 *
	 * @param string $key
	 * @return bool Success
	 */
	abstract public function unlock( $key );

	/**
	 * Get a lightweight exclusive self-unlocking lock
	 *
	 * Note that the same lock cannot be acquired twice.
	 *
	 * This is useful for task de-duplication or to avoid obtrusive
	 * (though non-corrupting) DB errors like INSERT key conflicts
	 * or deadlocks when using LOCK IN SHARE MODE.
	 *
	 * @param string $key
	 * @param int $timeout Lock wait timeout; 0 for non-blocking [optional]
	 * @param int $expiry Lock expiry [optional]; 1 day maximum
	 * @param string $rclass Allow reentry if set and the current lock used this value
	 * @return ScopedCallback|null Returns null on failure
	 * @since 1.26
	 */
	final public function getScopedLock( $key, $timeout = 6, $expiry = 30, $rclass = '' ) {
		// A falsy $expiry (e.g. 0) is treated as INF here, which min() then clamps to TTL_DAY
		$expiry = min( $expiry ?: INF, self::TTL_DAY );

		if ( !$this->lock( $key, $timeout, $expiry, $rclass ) ) {
			return null;
		}

		$lSince = $this->getCurrentTime(); // lock timestamp

		// The callback runs when the returned ScopedCallback is consumed or destroyed
		return new ScopedCallback( function () use ( $key, $lSince, $expiry ) {
			$latency = 0.050; // latency skew (err towards keeping lock present)
			$age = ( $this->getCurrentTime() - $lSince + $latency );
			// NOTE(review): $latency is already part of $age and is added again below, so the
			// effective margin is 2 * $latency and the logged age is padded; confirm intent.
			if ( ( $age + $latency ) >= $expiry ) {
				$this->logger->warning(
					"Lock for {key} held too long ({age} sec).",
					[ 'key' => $key, 'age' => $age ]
				);
				return; // expired; it's not "safe" to delete the key
			}
			$this->unlock( $key );
		} );
	}

	/**
	 * Delete all objects expiring before a certain date.
	 * @param string|int $timestamp The reference date in MW or TS_UNIX format
	 * @param callable|null $progress Optional, a function which will be called
	 *     regularly during long-running operations with the percentage progress
	 *     as the first parameter. [optional]
	 * @param int $limit Maximum number of keys to delete [default: INF]
	 *
	 * @return bool Success; false if unimplemented
	 */
	abstract public function deleteObjectsExpiringBefore(
		$timestamp,
		callable $progress = null,
		$limit = INF
	);

	/**
	 * Get an associative array containing the item for each of the keys that have items.
	 * @param string[] $keys List of keys
	 * @param int $flags Bitfield; supports READ_LATEST [optional]
	 * @return mixed[] Map of (key => value) for existing keys
	 */
	abstract public function getMulti( array $keys, $flags = 0 );

	/**
	 * Batch insertion/replace
	 *
	 * This does not support WRITE_ALLOW_SEGMENTS to avoid excessive read I/O
	 *
	 * WRITE_BACKGROUND can be used for bulk insertion where the response is not vital
	 *
	 * @param mixed[] $data Map of (key => value)
	 * @param int $exptime Either an interval in seconds or a unix timestamp for expiry
	 * @param int $flags Bitfield of BagOStuff::WRITE_* constants (since 1.33)
	 * @return bool Success
	 * @since 1.24
	 */
	abstract public function setMulti( array $data, $exptime = 0, $flags = 0 );

	/**
	 * Batch deletion
	 *
	 * This does not support WRITE_ALLOW_SEGMENTS to avoid excessive read I/O
	 *
	 * WRITE_BACKGROUND can be used for bulk deletion where the response is not vital
	 *
	 * @param string[] $keys List of keys
	 * @param int $flags Bitfield of BagOStuff::WRITE_* constants
	 * @return bool Success
	 * @since 1.33
	 */
	abstract public function deleteMulti( array $keys, $flags = 0 );

	/**
	 * Change the expiration of multiple keys that exist
	 *
	 * @see BagOStuff::changeTTL()
	 *
	 * @param string[] $keys List of keys
	 * @param int $exptime TTL or UNIX timestamp
	 * @param int $flags Bitfield of BagOStuff::WRITE_* constants (since 1.33)
	 * @return bool Success
	 * @since 1.34
	 */
	abstract public function changeTTLMulti( array $keys, $exptime, $flags = 0 );

	/**
	 * Increase stored value of $key by $value while preserving its TTL
	 * @param string $key Key to increase
	 * @param int $value Value to add to $key (default: 1) [optional]
	 * @param int $flags Bit field of class WRITE_* constants [optional]
	 * @return int|bool New value or false on failure
	 */
	abstract public function incr( $key, $value = 1, $flags = 0 );

	/**
	 * Decrease stored value of $key by $value while preserving its TTL
	 * @param string $key
	 * @param int $value Value to subtract from $key (default: 1) [optional]
	 * @param int $flags Bit field of class WRITE_* constants [optional]
	 * @return int|bool New value or false on failure
	 */
	abstract public function decr( $key, $value = 1, $flags = 0 );

	/**
	 * Increase the value of the given key (no TTL change) if it exists or create it otherwise
	 *
	 * This will create the key with the value $init and TTL $exptime instead if not present.
	 * Callers should make sure that both ($init - $value) and $exptime are invariants for all
	 * operations to any given key. The value of $init should be at least that of $value.
	 *
	 * @param string $key Key built via makeKey() or makeGlobalKey()
	 * @param int $exptime Time-to-live (in seconds) or a UNIX timestamp expiration
	 * @param int $value Amount to increase the key value by [default: 1]
	 * @param int|null $init Value to initialize the key to if it does not exist [default: $value]
	 * @param int $flags Bit field of class WRITE_* constants [optional]
	 * @return int|bool New value or false on failure
	 * @since 1.24
	 */
	abstract public function incrWithInit( $key, $exptime, $value = 1, $init = null, $flags = 0 );

	/**
	 * Get the "last error" registered; clearLastError() should be called manually
	 * @return int ERR_* constant for the "last error" registry
	 * @since 1.23
	 */
	abstract public function getLastError();

	/**
	 * Clear the "last error" registry
	 * @since 1.23
	 */
	abstract public function clearLastError();

	/**
	 * Let a callback be run to avoid wasting time on special blocking calls
	 *
	 * The callbacks may or may not be called ever, in any particular order.
	 * They are likely to be invoked when something WRITE_SYNC is used.
	 * They should follow a caching pattern as shown below, so that any code
	 * using the work will get its result no matter what happens.
	 * @code
	 *     $result = null;
	 *     $workCallback = function () use ( &$result ) {
	 *         if ( !$result ) {
	 *             $result = ....
	 *         }
	 *         return $result;
	 *     };
	 * @endcode
	 *
	 * @param callable $workCallback
	 * @since 1.28
	 */
	abstract public function addBusyCallback( callable $workCallback );

	/**
	 * Construct a cache key.
	 *
	 * @since 1.27
	 * @param string $keyspace
	 * @param array $args
	 * @return string Colon-delimited list of $keyspace followed by escaped components of $args
	 */
	abstract public function makeKeyInternal( $keyspace, $args );

	/**
	 * Make a global cache key.
	 *
	 * @since 1.27
	 * @param string $class Key class
	 * @param string|int ...$components Key components (starting with a key collection name)
	 * @return string Colon-delimited list of $keyspace followed by escaped components
	 */
	abstract public function makeGlobalKey( $class, ...$components );

	/**
	 * Make a cache key, scoped to this instance's keyspace.
	 *
	 * @since 1.27
	 * @param string $class Key class
	 * @param string|int ...$components Key components (starting with a key collection name)
	 * @return string Colon-delimited list of $keyspace followed by escaped components
	 */
	abstract public function makeKey( $class, ...$components );

	/**
	 * Look up the quality-of-service level registered for an attribute
	 *
	 * @param int $flag ATTR_* class constant
	 * @return int QOS_* class constant (QOS_UNKNOWN if the attribute is not in the map)
	 * @since 1.28
	 */
	public function getQoS( $flag ) {
		return $this->attrMap[$flag] ?? self::QOS_UNKNOWN;
	}

	/**
	 * @return int|float The chunk size, in bytes, of segmented objects (INF for no limit)
	 * @since 1.34
	 */
	public function getSegmentationSize() {
		return INF;
	}

	/**
	 * @return int|float Maximum total segmented object size in bytes (INF for no limit)
	 * @since 1.34
	 */
	public function getSegmentedValueMaxSize() {
		return INF;
	}

	/**
	 * Check whether every bit of $flags is set in $field
	 *
	 * @param int $field
	 * @param int $flags
	 * @return bool
	 * @since 1.34
	 */
	final protected function fieldHasFlags( $field, $flags ) {
		return ( ( $field & $flags ) === $flags );
	}

	/**
	 * Merge the flag maps of one or more BagOStuff objects into a "lowest common denominator" map
	 *
	 * @param BagOStuff[] $bags
	 * @return int[] Resulting flag map (class ATTR_* constant => class QOS_* constant)
	 */
	final protected function mergeFlagMaps( array $bags ) {
		$map = [];
		foreach ( $bags as $bag ) {
			foreach ( $bag->attrMap as $attr => $rank ) {
				if ( isset( $map[$attr] ) ) {
					// Keep the lowest rank seen so far for this attribute
					$map[$attr] = min( $map[$attr], $rank );
				} else {
					$map[$attr] = $rank;
				}
			}
		}

		return $map;
	}

	/**
	 * Prepare values for storage and get their serialized sizes, or, estimate those sizes
	 *
	 * This is only useful if the caller needs an estimate of the serialized object sizes.
	 * The caller cannot know the serialization format and even if it did, it could be expensive
	 * to serialize complex values twice just to get the size information before writing them to
	 * cache. This method solves both problems by making the cache instance do the serialization
	 * and having it reuse the result when the cache write happens.
	 *
	 * When using this method, the caller must invoke it for each value, in order, that will
	 * be passed to the next write cache instance. All previously prepared values are cleared.
	 *
	 * @param array $valuesByKey Map of (cache key => PHP variable value to serialize)
	 * @return int[]|null[] Corresponding serialized value size list (null for invalid values)
	 * @since 1.35
	 */
	abstract public function setNewPreparedValues( array $valuesByKey );

	/**
	 * Get the current time, honouring any mock time installed via setMockTime()
	 *
	 * @internal For testing only
	 * @return float UNIX timestamp
	 * @codeCoverageIgnore
	 */
	public function getCurrentTime() {
		// Use ?? rather than ?: so that a mock timestamp of 0.0 is honoured instead of
		// silently falling through to the real clock; only null means "no override".
		return $this->wallClockOverride ?? microtime( true );
	}

	/**
	 * Install a mock clock; the value is bound by reference so later changes to $time apply
	 *
	 * @internal For testing only
	 * @param float|null &$time Mock UNIX timestamp
	 * @codeCoverageIgnore
	 */
	public function setMockTime( &$time ) {
		$this->wallClockOverride =& $time;
	}
}
|