composer: * mediawiki/mediawiki-codesniffer: 36.0.0 → 37.0.0 The following sniffs now pass and were enabled: * Generic.ControlStructures.InlineControlStructure * MediaWiki.PHPUnit.AssertCount.NotUsed npm: * svgo: 2.3.0 → 2.3.1 * https://npmjs.com/advisories/1754 (CVE-2021-33587) Change-Id: I2a9bbee2fecbf7259876d335f565ece4b3622426
523 lines
16 KiB
PHP
523 lines
16 KiB
PHP
<?php
|
||
|
||
use MediaWiki\MediaWikiServices;
|
||
use Wikimedia\Rdbms\LoadBalancerSingle;
|
||
|
||
/**
|
||
* @group Search
|
||
* @group Database
|
||
*
|
||
* @covers SearchEngine<extended>
|
||
* @note Coverage will only ever show one of the Search* classes
|
||
*/
|
||
class SearchEngineTest extends MediaWikiLangTestCase {
|
||
|
||
/**
|
||
* @var SearchEngine
|
||
*/
|
||
protected $search;
|
||
|
||
/**
 * Builds the search engine under test on top of the test database.
 *
 * The current test is skipped unless the database is MySQL, or SQLite
 * with the FTS3 full-text module.
 */
protected function setUp(): void {
	parent::setUp();

	// Search tests require MySQL or SQLite with FTS
	$type = $this->db->getType();
	if ( $type === 'sqlite' ) {
		$supported = $this->db->getFulltextSearchModule() == 'FTS3';
	} else {
		$supported = $type === 'mysql';
	}
	if ( !$supported ) {
		$this->markTestSkipped( "MySQL or SQLite with FTS3 only" );
	}

	$engineClass = SearchEngineFactory::getSearchEngineClass( $this->db );
	$capitalLinkOverrides = [
		// for testCompletionSearchMustRespectCapitalLinkOverrides
		NS_CATEGORY => false,
	];
	$this->setMwGlobals( [
		'wgSearchType' => $engineClass,
		'wgCapitalLinks' => true,
		'wgCapitalLinkOverrides' => $capitalLinkOverrides,
	] );

	// The engine talks to the test connection through a single-connection load balancer.
	$this->search = new $engineClass( LoadBalancerSingle::newFromConnection( $this->db ) );
	$hookContainer = MediaWikiServices::getInstance()->getHookContainer();
	$this->search->setHookContainer( $hookContainer );
}
|
||
|
||
/**
 * Discards the per-test search engine, then runs the parent clean-up.
 */
protected function tearDown(): void {
	// Drop the engine reference before the parent tears the environment down.
	unset( $this->search );
	parent::tearDown();
}
|
||
|
||
/**
 * Inserts the fixture pages queried by the search tests of this class.
 *
 * Nothing is inserted when the main namespace does not hold wikitext.
 */
public function addDBDataOnce() {
	if ( !$this->isWikitextNS( NS_MAIN ) ) {
		// @todo cover the case of non-wikitext content in the main namespace
		return;
	}

	// Reset the search type back to default - some extensions may have
	// overridden it.
	$this->setMwGlobals( [
		'wgSearchType' => null,
		'wgCapitalLinks' => true,
		'wgCapitalLinkOverrides' => [
			NS_CATEGORY => false // for testCompletionSearchMustRespectCapitalLinkOverrides
		],
	] );

	// Page title => page text, inserted in this order.
	// The Full* pages deliberately hold full-width (U+FFxx) characters while
	// the Half* pages hold their ASCII counterparts, so that width
	// normalization is actually exercised by testFullWidth.
	$pages = [
		'Not_Main_Page' => 'This is not a main page',
		'Talk:Not_Main_Page' => 'This is not a talk page to the main page, see [[smithee]]',
		'Smithee' => 'A smithee is one who smiths. See also [[Alan Smithee]]',
		'Talk:Smithee' => 'This article sucks.',
		'Unrelated_page' => 'Nothing in this page is about the S word.',
		'Another_page' => 'This page also is unrelated.',
		'Help:Help' => 'Help me!',
		'Thppt' => 'Blah blah',
		'Alan_Smithee' => 'yum',
		'Pages' => 'are\'food',
		'HalfOneUp' => 'AZ',
		'FullOneUp' => 'ＡＺ',
		'HalfTwoLow' => 'az',
		'FullTwoLow' => 'ａｚ',
		'HalfNumbers' => '1234567890',
		'FullNumbers' => '１２３４５６７８９０',
		// Inserted once; a second identical insertion added nothing.
		'DomainName' => 'example.com',
		'Category:search is not Search' => '',
		'Category:Search is not search' => '',
	];

	foreach ( $pages as $title => $text ) {
		$this->insertPage( $title, $text );
	}
}
|
||
|
||
/**
 * Collects the prefixed title text of every row in a result set.
 *
 * Marks the test incomplete when the main namespace is not wikitext.
 * The result set is freed once it has been read.
 *
 * @param object $results Iterable result set whose rows expose getTitle()
 * @return string[] Prefixed titles, ordered by sort()
 */
protected function fetchIds( $results ) {
	if ( !$this->isWikitextNS( NS_MAIN ) ) {
		$this->markTestIncomplete( __CLASS__ . " does not yet support non-wikitext content "
			. "in the main namespace" );
	}
	$this->assertIsObject( $results );

	$titles = [];
	foreach ( $results as $row ) {
		$titles[] = $row->getTitle()->getPrefixedText();
	}
	$results->free();

	// Search is not guaranteed to return results in a certain order;
	// sort the titles so callers can simply compare against the expected
	// list of matches.
	sort( $titles );

	return $titles;
}
|
||
|
||
/**
 * Half-width and full-width spellings of a query must match the same pages.
 */
public function testFullWidth() {
	$expected = [ 'FullOneUp', 'FullTwoLow', 'HalfOneUp', 'HalfTwoLow' ];

	// Query => assertion message. The last two queries use full-width
	// (U+FFxx) letters; with ASCII there they would merely repeat the
	// half-width checks.
	$queries = [
		'AZ' => "Search for normalized from Half-width Upper",
		'az' => "Search for normalized from Half-width Lower",
		'ＡＺ' => "Search for normalized from Full-width Upper",
		'ａｚ' => "Search for normalized from Full-width Lower",
	];

	foreach ( $queries as $query => $message ) {
		$this->assertEquals(
			$expected,
			$this->fetchIds( $this->search->searchText( $query ) ),
			$message
		);
	}
}
|
||
|
||
/**
 * A plain text query finds the page whose text contains the term.
 */
public function testTextSearch() {
	$resultSet = $this->search->searchText( 'smithee' );
	$found = $this->fetchIds( $resultSet );

	$this->assertEquals( [ 'Smithee' ], $found, "Plain search" );
}
|
||
|
||
/**
 * Wildcard queries, alone and combined with plain terms or phrases.
 */
public function testWildcardSearch() {
	// Each entry: [ query, expected titles, assertion message ]
	$cases = [
		[ 'smith*', [ 'Smithee' ], "Search with wildcards" ],
		[ 'smithson*', [], "Search with wildcards must not find unrelated articles" ],
		[
			'smith* smithee',
			[ 'Smithee' ],
			"Search with wildcards can be combined with simple terms"
		],
		[
			'smith* "one who smiths"',
			[ 'Smithee' ],
			"Search with wildcards can be combined with phrase search"
		],
	];

	foreach ( $cases as [ $query, $expected, $message ] ) {
		$found = $this->fetchIds( $this->search->searchText( $query ) );
		$this->assertEquals( $expected, $found, $message );
	}
}
|
||
|
||
/**
 * Quoted phrases must match adjacent terms in the given order only.
 */
public function testPhraseSearch() {
	// Each entry: [ query, expected titles, assertion message ]
	$cases = [
		[ '"smithee is one who smiths"', [ 'Smithee' ], "Search a phrase" ],
		[
			'"smithee is who smiths"',
			[],
			"Phrase search is not sloppy, search terms must be adjacent"
		],
		[ '"is smithee one who smiths"', [], "Phrase search is ordered" ],
	];

	foreach ( $cases as [ $query, $expected, $message ] ) {
		$found = $this->fetchIds( $this->search->searchText( $query ) );
		$this->assertEquals( $expected, $found, $message );
	}
}
|
||
|
||
/**
 * The snippet of a phrase match wraps the whole phrase in one highlight span.
 */
public function testPhraseSearchHighlight() {
	$phrase = "smithee is one who smiths";
	$quotedQuery = '"' . $phrase . '"';

	// Only the first result of the set is inspected.
	$firstHit = $this->search->searchText( $quotedQuery )->getIterator()->current();
	$expectedStart = "A <span class='searchmatch'>{$phrase}</span>";

	$this->assertStringStartsWith(
		$expectedStart,
		$firstHit->getTextSnippet(),
		"Highlight a phrase search"
	);
}
|
||
|
||
/**
 * Text search restricted to namespaces 0, 1 and 4.
 */
public function testTextPowerSearch() {
	$this->search->setNamespaces( [ 0, 1, 4 ] );

	$found = $this->fetchIds( $this->search->searchText( 'smithee' ) );
	$expected = [ 'Smithee', 'Talk:Not Main Page' ];

	$this->assertEquals( $expected, $found, "Power search" );
}
|
||
|
||
/**
 * Title search with the engine's namespace selection left untouched.
 */
public function testTitleSearch() {
	$found = $this->fetchIds( $this->search->searchTitle( 'smithee' ) );
	$expected = [ 'Alan Smithee', 'Smithee' ];

	$this->assertEquals( $expected, $found, "Title search" );
}
|
||
|
||
/**
 * Title search restricted to namespaces 0, 1 and 4.
 */
public function testTextTitlePowerSearch() {
	$this->search->setNamespaces( [ 0, 1, 4 ] );

	$found = $this->fetchIds( $this->search->searchTitle( 'smithee' ) );
	$expected = [ 'Alan Smithee', 'Smithee', 'Talk:Smithee' ];

	$this->assertEquals( $expected, $found, "Title power search" );
}
|
||
|
||
/**
 * Data sets for testCompletionSearchMustRespectCapitalLinkOverrides.
 *
 * Each data set is [ search string, expected suggestion text, namespaces ].
 * The label of each set names the page it actually expects to find.
 *
 * @return array[]
 */
public function provideCompletionSearchMustRespectCapitalLinkOverrides() {
	return [
		'Searching for "smithee" finds Smithee on NS_MAIN' => [
			'smithee',
			'Smithee',
			[ NS_MAIN ],
		],
		'Searching for "search is" finds "search is not Search" on NS_CATEGORY' => [
			'search is',
			'Category:search is not Search',
			[ NS_CATEGORY ],
		],
		'Searching for "Search is" finds "Search is not search" on NS_CATEGORY' => [
			'Search is',
			'Category:Search is not search',
			[ NS_CATEGORY ],
		],
		'Copy-pasted wikilinks with invalid characters will still find the page' => [
			'[[smithee]]',
			'Smithee',
			[ NS_MAIN ],
		],
	];
}
|
||
|
||
/**
 * Test that the search query is not munged using a wrong CapitalLinks setup
 * (in other words, test that the default search backend can benefit from
 * wgCapitalLinkOverrides).
 * Guard against regressions like T208255
 * @dataProvider provideCompletionSearchMustRespectCapitalLinkOverrides
 * @covers SearchEngine::completionSearch
 * @covers PrefixSearch::defaultSearchBackend
 * @param string $search
 * @param string $expectedSuggestion
 * @param int[] $namespaces
 */
public function testCompletionSearchMustRespectCapitalLinkOverrides(
	$search,
	$expectedSuggestion,
	array $namespaces
) {
	$this->search->setNamespaces( $namespaces );
	$suggestionSet = $this->search->completionSearch( $search );

	// Exactly one suggestion is expected, and it must be the given page.
	$this->assertSame( 1, $suggestionSet->getSize() );
	$firstSuggestion = $suggestionSet->getSuggestions()[0];
	$this->assertEquals( $expectedSuggestion, $firstSuggestion->getText() );
}
|
||
|
||
/**
 * @covers SearchEngine::getSearchIndexFields
 */
public function testSearchIndexFields() {
	// Factory for mocked field definitions. It is not static because it
	// needs $this to build the mocks.
	$buildField = function ( $name, $type ) {
		$fieldBuilder = $this->getMockBuilder( SearchIndexFieldDefinition::class );
		$fieldBuilder->setConstructorArgs( [ $name, $type ] );
		$field = $fieldBuilder->getMock();

		$field->method( 'getMapping' )->willReturn( [
			'testData' => 'test',
			'name' => $name,
			'type' => $type,
		] );
		$field->method( 'merge' )->willReturn( $field );

		return $field;
	};

	// Only makeSearchFieldMapping() is replaced on the engine.
	$engineBuilder = $this->getMockBuilder( SearchEngine::class );
	$engineBuilder->onlyMethods( [ 'makeSearchFieldMapping' ] );
	/** @var SearchEngine $searchEngine */
	$searchEngine = $engineBuilder->getMock();
	$searchEngine->expects( $this->atLeastOnce() )
		->method( 'makeSearchFieldMapping' )
		->willReturnCallback( $buildField );

	// Not using mock since PHPUnit mocks do not work properly with references in params
	$this->setTemporaryHook(
		'SearchIndexFields',
		static function ( &$fields, SearchEngine $engine ) use ( $buildField ) {
			$fields['testField'] = $buildField( "testField", SearchIndexField::INDEX_TYPE_TEXT );
			return true;
		}
	);
	$searchEngine->setHookContainer( MediaWikiServices::getInstance()->getHookContainer() );

	$indexFields = $searchEngine->getSearchIndexFields();
	$this->assertArrayHasKey( 'language', $indexFields );
	$this->assertArrayHasKey( 'category', $indexFields );

	$testField = $indexFields['testField'];
	$this->assertInstanceOf( SearchIndexField::class, $testField );

	$mapping = $testField->getMapping( $searchEngine );
	$this->assertArrayHasKey( 'testData', $mapping );
	$this->assertEquals( 'test', $mapping['testData'] );
}
|
||
|
||
/**
 * Hook-style handler that registers a 'testField' search index field.
 *
 * NOTE(review): no call site is visible in this file; testSearchIndexFields
 * registers an equivalent closure instead. Confirm before removing.
 *
 * @param callable $mockFieldBuilder Called with ( field name, index type )
 * @param array &$fields Field map that receives the 'testField' entry
 * @param SearchEngine $engine Unused
 * @return bool Always true
 */
public function hookSearchIndexFields( $mockFieldBuilder, &$fields, SearchEngine $engine ) {
	$testField = $mockFieldBuilder( "testField", SearchIndexField::INDEX_TYPE_TEXT );
	$fields['testField'] = $testField;

	return true;
}
|
||
|
||
/**
 * Augmentors registered through the SearchResultsAugment hook must attach
 * their data to every result of the set.
 */
public function testAugmentorSearch() {
	$this->search->setNamespaces( [ 0, 1, 4 ] );
	$resultSet = $this->search->searchText( 'smithee' );

	// Not using mock since PHPUnit mocks do not work properly with references in params
	$hookHandlers = [ 'SearchResultsAugment' => [ [ $this, 'addAugmentors' ] ] ];
	$this->mergeMwGlobalArrayValue( 'wgHooks', $hookHandlers );
	$this->search->augmentSearchResults( $resultSet );

	foreach ( $resultSet as $result ) {
		$title = $result->getTitle();
		$id = $title->getArticleID();
		$text = $title->getText();

		// Same strings as the callbacks installed by addAugmentors() produce.
		$expected = [
			'testSet' => "Result:{$id}:{$text}",
			'testRow' => "Result2:{$id}:{$text}",
		];
		$this->assertEquals( $expected, $result->getExtensionData() );
	}
}
|
||
|
||
/**
 * Handler for the SearchResultsAugment hook used by testAugmentorSearch.
 *
 * Registers one mocked set augmentor under 'testSet' (expected to run once)
 * and one mocked row augmentor under 'testRow' (expected to run twice).
 *
 * @param array &$setAugmentors
 * @param array &$rowAugmentors
 */
public function addAugmentors( &$setAugmentors, &$rowAugmentors ) {
	// Set-level augmentor: returns "Result:<id>:<title text>" keyed by article id.
	$describeAll = static function ( ISearchResultSet $resultSet ) {
		$byId = [];
		/** @var SearchResult $result */
		foreach ( $resultSet as $result ) {
			$title = $result->getTitle();
			$id = $title->getArticleID();
			$byId[$id] = "Result:{$id}:" . $title->getText();
		}
		return $byId;
	};
	$forSet = $this->createMock( ResultSetAugmentor::class );
	$forSet->expects( $this->once() )
		->method( 'augmentAll' )
		->willReturnCallback( $describeAll );
	$setAugmentors['testSet'] = $forSet;

	// Row-level augmentor: returns "Result2:<id>:<title text>" for one result.
	$describeOne = static function ( SearchResult $result ) {
		$title = $result->getTitle();
		$id = $title->getArticleID();
		return "Result2:{$id}:" . $title->getText();
	};
	$forRow = $this->createMock( ResultAugmentor::class );
	$forRow->expects( $this->exactly( 2 ) )
		->method( 'augment' )
		->willReturnCallback( $describeOne );
	$rowAugmentors['testRow'] = $forRow;
}
|
||
|
||
/**
 * Completion search must drop suggestions whose pages do not exist.
 *
 * Twelve titles are offered to the mock engine but only the even-numbered
 * ones are created as pages.
 */
public function testFiltersMissing() {
	$availableResults = [];
	for ( $i = 0; $i <= 11; $i++ ) {
		$title = "Search_Result_$i";
		$availableResults[] = $title;
		// pages not created must be filtered
		if ( $i % 2 === 0 ) {
			$this->editSearchResultPage( $title );
		}
	}
	MockCompletionSearchEngine::addMockResults( 'foo', $availableResults );

	$engine = new MockCompletionSearchEngine();
	$engine->setLimitOffset( 10, 0 );
	$engine->setHookContainer( MediaWikiServices::getInstance()->getHookContainer() );

	// First window (titles 0-9): the five even-numbered pages exist.
	$results = $engine->completionSearch( 'foo' );
	$this->assertSame( 5, $results->getSize() );
	$this->assertTrue( $results->hasMoreResults() );

	// Second window (titles 10-11): only Search_Result_10 exists.
	$engine->setLimitOffset( 10, 10 );
	$results = $engine->completionSearch( 'foo' );
	$this->assertSame( 1, $results->getSize() );
	$this->assertFalse( $results->hasMoreResults() );
}
|
||
|
||
/**
 * Creates a wikitext page with fixed content, saved as the test sysop.
 *
 * @param string $title Title text of the page to create
 */
private function editSearchResultPage( $title ) {
	$page = WikiPage::factory( Title::newFromText( $title ) );
	$content = new WikitextContent( 'UTContent' );
	$author = $this->getTestSysop()->getUser();
	$flags = EDIT_NEW | EDIT_SUPPRESS_RC;

	$page->doUserEditContent( $content, $author, 'UTPageSummary', $flags );
}
|
||
|
||
/**
 * Data sets for testParseNamespacePrefix.
 *
 * Each data set is [ params, expected ]. params always has 'query' and may
 * have 'withAll' and/or 'withHook'. expected is false, or a
 * [ remaining query, namespaces or null ] pair.
 *
 * @return array[]
 */
public function provideDataForParseNamespacePrefix() {
	$cases = [];

	$cases['noop'] = [ [ 'query' => 'foo' ], false ];
	$cases['empty'] = [ [ 'query' => '' ], false ];
	$cases['namespace prefix'] = [
		[ 'query' => 'help:test' ],
		[ 'test', [ NS_HELP ] ],
	];
	$cases['accented namespace prefix with hook'] = [
		[ 'query' => 'hélp:test', 'withHook' => true ],
		[ 'test', [ NS_HELP ] ],
	];
	$cases['accented namespace prefix without hook'] = [
		[ 'query' => 'hélp:test', 'withHook' => false ],
		false,
	];
	$cases['all with all keyword allowed'] = [
		[ 'query' => 'all:test', 'withAll' => true ],
		[ 'test', null ],
	];
	$cases['all with all keyword disallowed'] = [
		[ 'query' => 'all:test', 'withAll' => false ],
		false,
	];
	$cases['ns only'] = [
		[ 'query' => 'help:' ],
		[ '', [ NS_HELP ] ],
	];
	$cases['all only'] = [
		[ 'query' => 'all:', 'withAll' => true ],
		[ '', null ],
	];
	$cases['all wins over namespace when first'] = [
		[ 'query' => 'all:help:test', 'withAll' => true ],
		[ 'help:test', null ],
	];
	$cases['ns wins over all when first'] = [
		[ 'query' => 'help:all:test', 'withAll' => true ],
		[ 'all:test', [ NS_HELP ] ],
	];

	return $cases;
}
|
||
|
||
/**
 * Runs SearchEngine::parseNamespacePrefixes() for every combination of the
 * 'withAll' and 'withHook' flags that the data set leaves open.
 *
 * A flag present in $params is used as given. A flag that is absent is
 * tested with both true and false, so a data set with neither flag covers
 * all four combinations.
 *
 * @dataProvider provideDataForParseNamespacePrefix
 * @param array $params 'query' plus optional 'withAll' / 'withHook' flags
 * @param array|false $expected Expected return value for every combination
 */
public function testParseNamespacePrefix( array $params, $expected ) {
	// Temporary hook that maps the accented "hélp:" prefix to NS_HELP.
	$this->setTemporaryHook( 'PrefixSearchExtractNamespace', static function ( &$namespaces, &$query ) {
		if ( strpos( $query, 'hélp:' ) === 0 ) {
			$namespaces = [ NS_HELP ];
			$query = substr( $query, strlen( 'hélp:' ) );
		}
		return false;
	} );

	$withAllValues = isset( $params['withAll'] ) ? [ $params['withAll'] ] : [ true, false ];
	$withHookValues = isset( $params['withHook'] ) ? [ $params['withHook'] ] : [ true, false ];

	// Full cross product of the open flags. This includes
	// ( withAll => false, withHook => true ), which was previously missing
	// because ( true, false ) was listed twice.
	$testSet = [];
	foreach ( $withAllValues as $withAll ) {
		foreach ( $withHookValues as $withHook ) {
			// "+" keeps the keys already in $params and only fills in absent ones.
			$testSet[] = $params + [ 'withAll' => $withAll, 'withHook' => $withHook ];
		}
	}

	foreach ( $testSet as $test ) {
		$actual = SearchEngine::parseNamespacePrefixes(
			$test['query'],
			$test['withAll'],
			$test['withHook']
		);
		$this->assertEquals( $expected, $actual, 'with params: ' . print_r( $test, true ) );
	}
}
|
||
}
|