2013-01-04 09:23:26 +00:00
|
|
|
<?php
|
2012-10-18 09:33:15 +00:00
|
|
|
/**
|
|
|
|
|
* Methods to play with arrays.
|
|
|
|
|
*
|
|
|
|
|
* This program is free software; you can redistribute it and/or modify
|
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
|
|
|
* (at your option) any later version.
|
|
|
|
|
*
|
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
|
*
|
|
|
|
|
* You should have received a copy of the GNU General Public License along
|
|
|
|
|
* with this program; if not, write to the Free Software Foundation, Inc.,
|
|
|
|
|
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
|
|
|
|
* http://www.gnu.org/copyleft/gpl.html
|
|
|
|
|
*
|
|
|
|
|
* @file
|
|
|
|
|
*/
|
2013-01-04 09:23:26 +00:00
|
|
|
|
2012-10-18 09:33:15 +00:00
|
|
|
/**
|
|
|
|
|
* A collection of static methods to play with arrays.
|
2014-01-25 05:25:43 +00:00
|
|
|
*
|
|
|
|
|
* @since 1.21
|
2012-10-18 09:33:15 +00:00
|
|
|
*/
|
2013-01-04 09:23:26 +00:00
|
|
|
class ArrayUtils {
|
|
|
|
|
/**
|
|
|
|
|
* Sort the given array in a pseudo-random order which depends only on the
|
2016-04-18 19:09:54 +00:00
|
|
|
* given key and each element value in $array. This is typically used for load
|
2013-01-04 09:23:26 +00:00
|
|
|
* balancing between servers each with a local cache.
|
|
|
|
|
*
|
|
|
|
|
* Keys are preserved. The input array is modified in place.
|
|
|
|
|
*
|
|
|
|
|
* Note: Benchmarking on PHP 5.3 and 5.4 indicates that for small
|
|
|
|
|
* strings, md5() is only 10% slower than hash('joaat',...) etc.,
|
|
|
|
|
* since the function call overhead dominates. So there's not much
|
|
|
|
|
* justification for breaking compatibility with installations
|
|
|
|
|
* compiled with ./configure --disable-hash.
|
2013-02-03 20:05:24 +00:00
|
|
|
*
|
2017-08-11 00:23:16 +00:00
|
|
|
* @param array &$array Array to sort
|
2013-10-04 13:43:09 +00:00
|
|
|
* @param string $key
|
|
|
|
|
* @param string $separator A separator used to delimit the array elements and the
|
2013-02-03 20:05:24 +00:00
|
|
|
* key. This can be chosen to provide backwards compatibility with
|
2013-01-04 09:23:26 +00:00
|
|
|
* various consistent hash implementations that existed before this
|
|
|
|
|
* function was introduced.
|
|
|
|
|
*/
|
2013-03-05 23:05:21 +00:00
|
|
|
public static function consistentHashSort( &$array, $key, $separator = "\000" ) {
|
2016-02-17 09:09:32 +00:00
|
|
|
$hashes = [];
|
2013-01-04 09:23:26 +00:00
|
|
|
foreach ( $array as $elt ) {
|
|
|
|
|
$hashes[$elt] = md5( $elt . $separator . $key );
|
|
|
|
|
}
|
2021-02-10 22:31:02 +00:00
|
|
|
uasort( $array, static function ( $a, $b ) use ( $hashes ) {
|
2013-01-04 09:23:26 +00:00
|
|
|
return strcmp( $hashes[$a], $hashes[$b] );
|
|
|
|
|
} );
|
|
|
|
|
}
|
2013-03-05 23:05:21 +00:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Given an array of non-normalised probabilities, this function will select
|
|
|
|
|
* an element and return the appropriate key
|
|
|
|
|
*
|
2013-10-04 13:43:09 +00:00
|
|
|
* @param array $weights
|
2022-11-09 00:11:22 +00:00
|
|
|
* @return int|string|false
|
2013-03-05 23:05:21 +00:00
|
|
|
*/
|
2013-03-24 10:01:51 +00:00
|
|
|
public static function pickRandom( $weights ) {
|
2013-03-05 23:05:21 +00:00
|
|
|
if ( !is_array( $weights ) || count( $weights ) == 0 ) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$sum = array_sum( $weights );
|
|
|
|
|
if ( $sum == 0 ) {
|
|
|
|
|
# No loads on any of them
|
|
|
|
|
# In previous versions, this triggered an unweighted random selection,
|
|
|
|
|
# but this feature has been removed as of April 2006 to allow for strict
|
|
|
|
|
# separation of query groups.
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
$max = mt_getrandmax();
|
|
|
|
|
$rand = mt_rand( 0, $max ) / $max * $sum;
|
|
|
|
|
|
|
|
|
|
$sum = 0;
|
|
|
|
|
foreach ( $weights as $i => $w ) {
|
|
|
|
|
$sum += $w;
|
2013-03-05 23:18:47 +00:00
|
|
|
# Do not return keys if they have 0 weight.
|
|
|
|
|
# Note that the "all 0 weight" case is handed above
|
|
|
|
|
if ( $w > 0 && $sum >= $rand ) {
|
2013-03-05 23:05:21 +00:00
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
2013-11-04 09:29:25 +00:00
|
|
|
|
2013-03-05 23:05:21 +00:00
|
|
|
return $i;
|
|
|
|
|
}
|
2012-10-18 09:33:15 +00:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Do a binary search, and return the index of the largest item that sorts
|
|
|
|
|
* less than or equal to the target value.
|
|
|
|
|
*
|
2014-01-25 05:25:43 +00:00
|
|
|
* @since 1.23
|
|
|
|
|
*
|
2014-11-05 21:44:43 +00:00
|
|
|
* @param callable $valueCallback A function to call to get the value with
|
2012-10-18 09:33:15 +00:00
|
|
|
* a given array index.
|
2014-01-25 05:25:43 +00:00
|
|
|
* @param int $valueCount The number of items accessible via $valueCallback,
|
2012-10-18 09:33:15 +00:00
|
|
|
* indexed from 0 to $valueCount - 1
|
2014-11-05 21:44:43 +00:00
|
|
|
* @param callable $comparisonCallback A callback to compare two values, returning
|
2012-10-18 09:33:15 +00:00
|
|
|
* -1, 0 or 1 in the style of strcmp().
|
2022-02-28 03:05:58 +00:00
|
|
|
* @param mixed $target The target value to find.
|
2012-10-18 09:33:15 +00:00
|
|
|
*
|
|
|
|
|
* @return int|bool The item index of the lower bound, or false if the target value
|
|
|
|
|
* sorts before all items.
|
|
|
|
|
*/
|
2014-05-08 19:15:09 +00:00
|
|
|
public static function findLowerBound( $valueCallback, $valueCount,
|
|
|
|
|
$comparisonCallback, $target
|
|
|
|
|
) {
|
2012-10-18 09:33:15 +00:00
|
|
|
if ( $valueCount === 0 ) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$min = 0;
|
|
|
|
|
$max = $valueCount;
|
|
|
|
|
do {
|
|
|
|
|
$mid = $min + ( ( $max - $min ) >> 1 );
|
2018-06-09 23:26:32 +00:00
|
|
|
$item = $valueCallback( $mid );
|
|
|
|
|
$comparison = $comparisonCallback( $target, $item );
|
2012-10-18 09:33:15 +00:00
|
|
|
if ( $comparison > 0 ) {
|
|
|
|
|
$min = $mid;
|
|
|
|
|
} elseif ( $comparison == 0 ) {
|
|
|
|
|
$min = $mid;
|
|
|
|
|
break;
|
|
|
|
|
} else {
|
|
|
|
|
$max = $mid;
|
|
|
|
|
}
|
|
|
|
|
} while ( $min < $max - 1 );
|
|
|
|
|
|
|
|
|
|
if ( $min == 0 ) {
|
2018-06-09 23:26:32 +00:00
|
|
|
$item = $valueCallback( $min );
|
|
|
|
|
$comparison = $comparisonCallback( $target, $item );
|
2012-10-18 09:33:15 +00:00
|
|
|
if ( $comparison < 0 ) {
|
|
|
|
|
// Before the first item
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return $min;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Do array_diff_assoc() on multi-dimensional arrays.
|
|
|
|
|
*
|
|
|
|
|
* Note: empty arrays are removed.
|
|
|
|
|
*
|
2014-01-25 05:25:43 +00:00
|
|
|
* @since 1.23
|
|
|
|
|
*
|
|
|
|
|
* @param array $array1 The array to compare from
|
Get rid of unnecessary func_get_args() and friends
HHVM does not support variadic arguments with type hints. This is
mostly not a big problem, because we can just drop the type hint, but
for some reason PHPUnit adds a type hint of "array" when it creates
mocks, so a class with a variadic method can't be mocked (at least in
some cases). As such, I left alone all the classes that seem like
someone might like to mock them, like Title and User. If anyone wants
to mock them in the future, they'll have to switch back to
func_get_args(). Some of the changes are definitely safe, like
functions and test classes.
In most cases, func_get_args() (and/or func_get_arg(), func_num_args() )
were only present because the code was written before we required PHP
5.6, and writing them as variadic functions is strictly superior. In
some cases I left them alone, aside from HHVM compatibility:
* Forwarding all arguments to another function. It's useful to keep
func_get_args() here where we want to keep the list of expected
arguments and their meanings in the function signature line for
documentation purposes, but don't want to copy-paste a long line of
argument names.
* Handling deprecated calling conventions.
* One or two miscellaneous cases where we're basically using the
arguments individually but want to use them as an array as well for
some reason.
Change-Id: I066ec95a7beb7c0665146195a08e7cce1222c788
2018-10-08 14:10:45 +00:00
|
|
|
* @param array ...$arrays More arrays to compare against
|
2012-10-18 09:33:15 +00:00
|
|
|
* @return array An array containing all the values from array1
|
|
|
|
|
* that are not present in any of the other arrays.
|
|
|
|
|
*/
|
Get rid of unnecessary func_get_args() and friends
HHVM does not support variadic arguments with type hints. This is
mostly not a big problem, because we can just drop the type hint, but
for some reason PHPUnit adds a type hint of "array" when it creates
mocks, so a class with a variadic method can't be mocked (at least in
some cases). As such, I left alone all the classes that seem like
someone might like to mock them, like Title and User. If anyone wants
to mock them in the future, they'll have to switch back to
func_get_args(). Some of the changes are definitely safe, like
functions and test classes.
In most cases, func_get_args() (and/or func_get_arg(), func_num_args() )
were only present because the code was written before we required PHP
5.6, and writing them as variadic functions is strictly superior. In
some cases I left them alone, aside from HHVM compatibility:
* Forwarding all arguments to another function. It's useful to keep
func_get_args() here where we want to keep the list of expected
arguments and their meanings in the function signature line for
documentation purposes, but don't want to copy-paste a long line of
argument names.
* Handling deprecated calling conventions.
* One or two miscellaneous cases where we're basically using the
arguments individually but want to use them as an array as well for
some reason.
Change-Id: I066ec95a7beb7c0665146195a08e7cce1222c788
2018-10-08 14:10:45 +00:00
|
|
|
public static function arrayDiffAssocRecursive( $array1, ...$arrays ) {
|
2016-02-17 09:09:32 +00:00
|
|
|
$ret = [];
|
2012-10-18 09:33:15 +00:00
|
|
|
|
|
|
|
|
foreach ( $array1 as $key => $value ) {
|
|
|
|
|
if ( is_array( $value ) ) {
|
2016-02-17 09:09:32 +00:00
|
|
|
$args = [ $value ];
|
2012-10-18 09:33:15 +00:00
|
|
|
foreach ( $arrays as $array ) {
|
|
|
|
|
if ( isset( $array[$key] ) ) {
|
|
|
|
|
$args[] = $array[$key];
|
|
|
|
|
}
|
|
|
|
|
}
|
2018-06-09 23:26:32 +00:00
|
|
|
$valueret = self::arrayDiffAssocRecursive( ...$args );
|
2012-10-18 09:33:15 +00:00
|
|
|
if ( count( $valueret ) ) {
|
|
|
|
|
$ret[$key] = $valueret;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
foreach ( $arrays as $array ) {
|
|
|
|
|
if ( isset( $array[$key] ) && $array[$key] === $value ) {
|
|
|
|
|
continue 2;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
$ret[$key] = $value;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $ret;
|
|
|
|
|
}
|
Introduce $wgForceHTTPS
Add $wgForceHTTPS. When set to true:
* It makes the HTTP to HTTPS redirect unconditional and suppresses the
forceHTTPS cookie.
* It makes session cookies be secure.
* In the Action API, it triggers the existing deprecation warning and
avoids more expensive user/session checks.
* In login and signup, it suppresses the old hidden form fields for
protocol switching.
* It hides the prefershttps user preference.
Other changes:
* Factor out the HTTPS redirect in MediaWiki::main() into
maybeDoHttpsRedirect() and shouldDoHttpRedirect(). Improve
documentation.
* User::requiresHTTPS() reflects $wgForceHTTPS whereas the Session
concept of "force HTTPS" does not. The documentation of
User::requiresHTTPS() says that it includes configuration, and
retaining this definition was beneficial for some callers. Whereas
Session::shouldForceHTTPS() was used fairly narrowly as the value
of the forceHTTPS cookie, and injecting configuration into it is not
so easy or beneficial, so I left it as it was, except for clarifying
the documentation.
* Deprecate the following hooks: BeforeHttpsRedirect, UserRequiresHTTPS,
CanIPUseHTTPS. No known extension uses them, and they're not compatible
with the long-term goal of ending support for mixed-protocol wikis.
BeforeHttpsRedirect was documented as unstable from its inception.
CanIPUseHTTPS was a WMF config hack now superseded by GFOC's SNI
sniffing.
* For tests which failed with $wgForceHTTPS=true, I mostly split the
tests, testing each configuration value separately.
* Add ArrayUtils::cartesianProduct() as a helper for generating
combinations of boolean options in the session tests.
Bug: T256095
Change-Id: Iefb5ba55af35350dfc7c050f9fb8f4e8a79751cb
2020-06-24 00:56:46 +00:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Make an array consisting of every combination of the elements of the
|
|
|
|
|
* input arrays. Each element of the output array is an array with a number
|
|
|
|
|
* of elements equal to the number of input parameters.
|
|
|
|
|
*
|
|
|
|
|
* In mathematical terms, this is an n-ary Cartesian product.
|
|
|
|
|
*
|
|
|
|
|
* For example, ArrayUtils::cartesianProduct( [ 1, 2 ], [ 'a', 'b' ] )
|
|
|
|
|
* produces [ [ 1, 'a' ], [ 1, 'b' ], [ 2, 'a' ], [ 2, 'b' ] ]
|
|
|
|
|
*
|
|
|
|
|
* If any of the input arrays is empty, the result is the empty array [].
|
|
|
|
|
* This is in keeping with the mathematical definition.
|
|
|
|
|
*
|
|
|
|
|
* If no parameters are given, the result is also the empty array.
|
|
|
|
|
*
|
|
|
|
|
* The array keys are ignored. This implementation uses the internal
|
|
|
|
|
* pointers of the input arrays to keep track of the current position
|
|
|
|
|
* without referring to the keys.
|
|
|
|
|
*
|
|
|
|
|
* @since 1.35
|
|
|
|
|
*
|
|
|
|
|
* @param array ...$inputArrays
|
|
|
|
|
* @return array
|
|
|
|
|
*/
|
|
|
|
|
public static function cartesianProduct( ...$inputArrays ) {
|
|
|
|
|
$numInputs = count( $inputArrays );
|
|
|
|
|
if ( $numInputs === 0 ) {
|
|
|
|
|
return [];
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Reset the internal pointers
|
|
|
|
|
foreach ( $inputArrays as &$inputArray ) {
|
|
|
|
|
if ( !count( $inputArray ) ) {
|
|
|
|
|
return [];
|
|
|
|
|
}
|
|
|
|
|
reset( $inputArray );
|
|
|
|
|
}
|
|
|
|
|
unset( $inputArray );
|
|
|
|
|
|
|
|
|
|
$outputArrays = [];
|
|
|
|
|
$done = false;
|
|
|
|
|
while ( !$done ) {
|
|
|
|
|
// Construct the output array element
|
|
|
|
|
$element = [];
|
2022-09-21 19:05:03 +00:00
|
|
|
foreach ( $inputArrays as $inputArray ) {
|
Introduce $wgForceHTTPS
Add $wgForceHTTPS. When set to true:
* It makes the HTTP to HTTPS redirect unconditional and suppresses the
forceHTTPS cookie.
* It makes session cookies be secure.
* In the Action API, it triggers the existing deprecation warning and
avoids more expensive user/session checks.
* In login and signup, it suppresses the old hidden form fields for
protocol switching.
* It hides the prefershttps user preference.
Other changes:
* Factor out the HTTPS redirect in MediaWiki::main() into
maybeDoHttpsRedirect() and shouldDoHttpRedirect(). Improve
documentation.
* User::requiresHTTPS() reflects $wgForceHTTPS whereas the Session
concept of "force HTTPS" does not. The documentation of
User::requiresHTTPS() says that it includes configuration, and
retaining this definition was beneficial for some callers. Whereas
Session::shouldForceHTTPS() was used fairly narrowly as the value
of the forceHTTPS cookie, and injecting configuration into it is not
so easy or beneficial, so I left it as it was, except for clarifying
the documentation.
* Deprecate the following hooks: BeforeHttpsRedirect, UserRequiresHTTPS,
CanIPUseHTTPS. No known extension uses them, and they're not compatible
with the long-term goal of ending support for mixed-protocol wikis.
BeforeHttpsRedirect was documented as unstable from its inception.
CanIPUseHTTPS was a WMF config hack now superseded by GFOC's SNI
sniffing.
* For tests which failed with $wgForceHTTPS=true, I mostly split the
tests, testing each configuration value separately.
* Add ArrayUtils::cartesianProduct() as a helper for generating
combinations of boolean options in the session tests.
Bug: T256095
Change-Id: Iefb5ba55af35350dfc7c050f9fb8f4e8a79751cb
2020-06-24 00:56:46 +00:00
|
|
|
$element[] = current( $inputArray );
|
|
|
|
|
}
|
|
|
|
|
$outputArrays[] = $element;
|
|
|
|
|
|
|
|
|
|
// Increment the pointers starting from the least significant.
|
|
|
|
|
// If the least significant rolls over back to the start of the
|
|
|
|
|
// array, continue with the next most significant, and so on until
|
|
|
|
|
// that stops happening. If all pointers roll over, we are done.
|
|
|
|
|
$done = true;
|
|
|
|
|
for ( $paramIndex = $numInputs - 1; $paramIndex >= 0; $paramIndex-- ) {
|
|
|
|
|
next( $inputArrays[$paramIndex] );
|
|
|
|
|
if ( key( $inputArrays[$paramIndex] ) === null ) {
|
|
|
|
|
reset( $inputArrays[$paramIndex] );
|
|
|
|
|
// continue
|
|
|
|
|
} else {
|
|
|
|
|
$done = false;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return $outputArrays;
|
|
|
|
|
}
|
2013-01-04 09:23:26 +00:00
|
|
|
}
|