2010-12-14 16:26:35 +00:00
|
|
|
<?php
|
|
|
|
|
|
2023-11-21 21:08:14 +00:00
|
|
|
use MediaWiki\Deferred\SearchUpdate;
|
2023-07-20 21:37:24 +00:00
|
|
|
use MediaWiki\Page\PageIdentityValue;
|
2023-03-01 20:33:26 +00:00
|
|
|
|
2010-12-14 16:26:35 +00:00
|
|
|
/**
|
|
|
|
|
* @group Search
|
2024-01-27 00:11:07 +00:00
|
|
|
* @covers \MediaWiki\Deferred\SearchUpdate
|
2010-12-14 16:26:35 +00:00
|
|
|
*/
|
2020-06-30 15:09:24 +00:00
|
|
|
class SearchUpdateTest extends MediaWikiIntegrationTestCase {
|
2012-10-08 10:56:20 +00:00
|
|
|
|
2016-04-03 08:37:11 +00:00
|
|
|
/**
|
|
|
|
|
* @var SearchUpdate
|
|
|
|
|
*/
|
|
|
|
|
private $su;
|
|
|
|
|
|
2021-07-22 03:11:47 +00:00
|
|
|
protected function setUp(): void {
|
2012-10-08 10:56:20 +00:00
|
|
|
parent::setUp();
|
2023-07-20 21:37:24 +00:00
|
|
|
$pageIdentity = new PageIdentityValue( 42, NS_MAIN, 'Main_Page', PageIdentityValue::LOCAL );
|
2021-05-07 22:19:29 +00:00
|
|
|
$this->su = new SearchUpdate( 0, $pageIdentity );
|
2012-10-08 10:56:20 +00:00
|
|
|
}
|
2010-12-14 16:26:35 +00:00
|
|
|
|
2014-03-07 20:22:13 +00:00
|
|
|
public function updateText( $text ) {
|
2016-04-03 08:37:11 +00:00
|
|
|
return trim( $this->su->updateText( $text ) );
|
2010-12-14 16:26:35 +00:00
|
|
|
}
|
|
|
|
|
|
2013-10-23 22:51:31 +00:00
|
|
|
public function testUpdateText() {
|
2010-12-14 16:26:35 +00:00
|
|
|
$this->assertEquals(
|
|
|
|
|
'test',
|
|
|
|
|
$this->updateText( '<div>TeSt</div>' ),
|
|
|
|
|
'HTML stripped, text lowercased'
|
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
$this->assertEquals(
|
|
|
|
|
'foo bar boz quux',
|
|
|
|
|
$this->updateText( <<<EOT
|
|
|
|
|
<table style="color:red; font-size:100px">
|
|
|
|
|
<tr class="scary"><td><div>foo</div></td><tr>bar</td></tr>
|
|
|
|
|
<tr><td>boz</td><tr>quux</td></tr>
|
|
|
|
|
</table>
|
|
|
|
|
EOT
|
|
|
|
|
), 'Stripping HTML tables' );
|
|
|
|
|
|
|
|
|
|
$this->assertEquals(
|
|
|
|
|
'a b',
|
|
|
|
|
$this->updateText( 'a > b' ),
|
|
|
|
|
'Handle unclosed tags'
|
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
$text = str_pad( "foo <barbarbar \n", 10000, 'x' );
|
|
|
|
|
|
|
|
|
|
$this->assertNotEquals(
|
|
|
|
|
'',
|
|
|
|
|
$this->updateText( $text ),
|
2017-02-20 23:45:58 +00:00
|
|
|
'T20609'
|
2010-12-14 16:26:35 +00:00
|
|
|
);
|
|
|
|
|
}
|
2011-11-30 00:36:34 +00:00
|
|
|
|
2013-10-24 20:30:43 +00:00
|
|
|
/**
|
deferred: Widen `@covers` annotations in unit tests
Follows-up I98d2ecc987, I7555c9b6b5, I6d845bdfbb, I69b5385868, I4c7d826c7e,
I1287f3979a, which widened the `@covers` annotations of other suites:
> We lose useful coverage and spend valuable time keeping these tags
> accurate through refactors (or worse, forget to do so).
>
> I've audited each test to confirm it is a general test of the
> subject class, where adding any called methods would be an accepted
> change, thus widening it is merely a no-op that clarifies intent
> and reduces maintenance. I am not disabling the "only track coverage
> of specified subject" benefits, nor am I claiming coverage in
> in classes outside the subject under test.
>
> Tracking tiny details per-method wastes time in keeping references
> in sync during refactors, time to realize (and fix) when people
> inevitably don't keep them in sync, time lost in finding uncovered
> code to write tests for only to realize it was already covered but
> not yet claimed, etc.
Change-Id: I133c7b707aab7ceb4f2ecd3be38bd4bd1b194143
2023-08-21 23:01:58 +00:00
|
|
|
* T34712: Test if unicode quotes in article links make its search index empty
|
2013-10-24 20:30:43 +00:00
|
|
|
*/
|
2014-12-30 08:26:18 +00:00
|
|
|
public function testUnicodeLinkSearchIndexError() {
|
2011-11-30 00:36:34 +00:00
|
|
|
$text = "text „http://example.com“ text";
|
|
|
|
|
$result = $this->updateText( $text );
|
|
|
|
|
$processed = preg_replace( '/Q/u', 'Q', $result );
|
|
|
|
|
$this->assertTrue(
|
|
|
|
|
$processed != '',
|
|
|
|
|
'Link surrounded by unicode quotes should not fail UTF-8 validation'
|
|
|
|
|
);
|
|
|
|
|
}
|
2010-12-14 16:26:35 +00:00
|
|
|
}
|