2004-02-18 02:15:00 +00:00
|
|
|
<?php
|
2004-03-20 14:33:18 +00:00
|
|
|
# Cache for article titles (prefixed DB keys) and ids linked from one source
|
2003-04-14 23:10:40 +00:00
|
|
|
|
2003-07-06 11:42:42 +00:00
|
|
|
# Selector values for the $which argument of LinkCache::incrementalSetup().
# Links to existing pages
define( 'LINKCACHE_GOOD', 0 );
# Links to pages that do not exist
define( 'LINKCACHE_BAD', 1 );
# Image links; incrementalSetup() does not handle these and returns false
define( 'LINKCACHE_IMAGE', 2 );
|
|
|
|
|
|
2003-11-27 19:53:40 +00:00
|
|
|
class LinkCache {
	// Increment $mClassVer whenever old serialized versions of this class
	// become incompatible with the new version.
	/* private */ var $mClassVer = 2;

	# mGoodLinks:     title => article id, for links known to exist
	# mBadLinks:      title => 1, for links known not to exist
	# mActive:        while false, the add*Link() methods record nothing
	/* private */ var $mGoodLinks, $mBadLinks, $mActive;
	# mImageLinks:    image title => 1
	# mCategoryLinks: category title => sort key
	/* private */ var $mImageLinks, $mCategoryLinks;
	# mPreFilled is set once preFill()/fillFromLinkscc() has loaded a snapshot;
	# the mOld* arrays hold that snapshot for the get*Additions()/get*Deletions() diffs.
	/* private */ var $mPreFilled, $mOldGoodLinks, $mOldBadLinks;
	# Snapshot counterpart of mImageLinks. Nothing in this class fills it, so it
	# stays empty; it is declared so the image diff methods have an array to read.
	/* private */ var $mOldImageLinks;

	# Build the memcached key under which the article id for $title is stored.
	/* private */ function getKey( $title ) {
		global $wgDBname;
		return "$wgDBname:lc:title:$title";
	}

	# Constructor: start active, not pre-filled, with every link table empty.
	function LinkCache() {
		$this->mActive = true;
		$this->mPreFilled = false;
		$this->mGoodLinks = array();
		$this->mBadLinks = array();
		$this->mImageLinks = array();
		$this->mCategoryLinks = array();
		$this->mOldGoodLinks = array();
		$this->mOldBadLinks = array();
		$this->mOldImageLinks = array();
	}

	# Return the cached article id for $title, or 0 if it is not a known good link.
	function getGoodLinkID( $title ) {
		if ( array_key_exists( $title, $this->mGoodLinks ) ) {
			return $this->mGoodLinks[$title];
		}
		return 0;
	}

	# Return true if $title is recorded as a bad (non-existent) link.
	function isBadLink( $title ) {
		return array_key_exists( $title, $this->mBadLinks );
	}

	# Record $title as a good link with article id $id (no-op while suspended).
	function addGoodLink( $id, $title ) {
		if ( $this->mActive ) {
			$this->mGoodLinks[$title] = $id;
		}
	}

	# Record $title as a bad link (no-op while suspended or if already recorded).
	function addBadLink( $title ) {
		if ( $this->mActive && ( ! $this->isBadLink( $title ) ) ) {
			$this->mBadLinks[$title] = 1;
		}
	}

	# Record an image link by title string (no-op while suspended).
	function addImageLink( $title ) {
		if ( $this->mActive ) {
			$this->mImageLinks[$title] = 1;
		}
	}

	# Record an image link from a title object, keyed by its getDBkey().
	function addImageLinkObj( $nt ) {
		if ( $this->mActive ) {
			$this->mImageLinks[$nt->getDBkey()] = 1;
		}
	}

	# Record a category link with its sort key (no-op while suspended).
	function addCategoryLink( $title, $sortkey ) {
		if ( $this->mActive ) {
			$this->mCategoryLinks[$title] = $sortkey;
		}
	}

	# Record a category link from a title object, keyed by its getDBkey().
	function addCategoryLinkObj( &$nt, $sortkey ) {
		$this->addCategoryLink( $nt->getDBkey(), $sortkey );
	}

	# Forget that $title is a bad link, both locally and in memcached.
	function clearBadLink( $title ) {
		unset( $this->mBadLinks[$title] );
		$this->clearLink( $title );
	}

	# Drop the memcached entry for $title when $wgLinkCacheMemcached is enabled.
	function clearLink( $title ) {
		global $wgMemc, $wgLinkCacheMemcached;
		if( $wgLinkCacheMemcached ) {
			$wgMemc->delete( $this->getKey( $title ) );
		}
	}

	# suspend()/resume() switch recording by the add*Link() methods off and on.
	function suspend() { $this->mActive = false; }
	function resume() { $this->mActive = true; }

	# Accessors. getBadLinks() returns a plain list of titles; the others
	# return the underlying keyed arrays.
	function getGoodLinks() { return $this->mGoodLinks; }
	function getBadLinks() { return array_keys( $this->mBadLinks ); }
	function getImageLinks() { return $this->mImageLinks; }
	function getCategoryLinks() { return $this->mCategoryLinks; }

	# Look up (and cache) the article id for a title given as a DB key string.
	# Returns 0 if Title::newFromDBkey() yields no title or the page is missing.
	function addLink( $title ) {
		$nt = Title::newFromDBkey( $title );
		if( $nt ) {
			return $this->addLinkObj( $nt );
		}
		return 0;
	}

	# Look up (and cache) the article id for a title object.
	# Consults the in-memory tables first, then memcached (if enabled), then
	# the cur table. Returns the article id, or 0 if the page does not exist.
	function addLinkObj( &$nt ) {
		global $wgMemc, $wgLinkCacheMemcached;

		$title = $nt->getPrefixedDBkey();
		if ( $this->isBadLink( $title ) ) { return 0; }
		$id = $this->getGoodLinkID( $title );
		if ( 0 != $id ) { return $id; }

		$fname = "LinkCache::addLinkObj";
		wfProfileIn( $fname );

		$ns = $nt->getNamespace();
		$t = $nt->getDBkey();

		if ( "" == $title ) {
			wfProfileOut( $fname );
			return 0;
		}

		$id = NULL;
		if( $wgLinkCacheMemcached ) {
			$key = $this->getKey( $title );
			$id = $wgMemc->get( $key );
		}
		if( ! is_integer( $id ) ) {
			# Cache miss (or memcached disabled): ask the database
			$dbr =& wfGetDB( DB_READ );
			$id = $dbr->getField( 'cur', 'cur_id', array( 'cur_namespace' => $ns, 'cur_title' => $t ), $fname );
			# Normalise to an integer: a missing row becomes 0, and a found id
			# is stored and returned as an int, which is what the is_integer()
			# test above expects to see on a later cache hit.
			$id = intval( $id );
			if( $wgLinkCacheMemcached ) {
				$wgMemc->add( $key, $id, 3600*24 );
			}
		}

		if ( 0 == $id ) {
			$this->addBadLink( $title );
		} else {
			$this->addGoodLink( $id, $title );
		}
		wfProfileOut( $fname );
		return $id;
	}

	# Load every good and bad link of the page $fromtitle into the cache and
	# remember that state as the "old" snapshot used by the diff methods.
	# Note -- $fromtitle is a Title *object*
	function preFill( &$fromtitle ) {
		global $wgEnablePersistentLC;

		$fname = "LinkCache::preFill";
		wfProfileIn( $fname );

		# Recording is suspended around getArticleID() so that this lookup
		# leaves the link tables untouched.
		$this->suspend();
		$id = $fromtitle->getArticleID();
		$this->resume();

		if( $id == 0 ) {
			wfDebug( "$fname - got id 0 for title '" . $fromtitle->getPrefixedDBkey() . "'\n" );
			wfProfileOut( $fname );
			return;
		}

		# Try the persistent (linkscc) copy first
		if ( $wgEnablePersistentLC ) {
			if( $this->fillFromLinkscc( $id ) ) {
				wfProfileOut( $fname );
				return;
			}
		}

		$dbr =& wfGetDB( DB_READ );
		$cur = $dbr->tableName( 'cur' );
		$links = $dbr->tableName( 'links' );

		$sql = "SELECT cur_id,cur_namespace,cur_title
			FROM $cur,$links
			WHERE cur_id=l_to AND l_from=$id";
		$res = $dbr->query( $sql, $fname );
		while( $s = $dbr->fetchObject( $res ) ) {
			$this->addGoodLink( $s->cur_id,
				Title::makeName( $s->cur_namespace, $s->cur_title )
			);
		}

		$res = $dbr->select( 'brokenlinks', array( 'bl_to' ), array( 'bl_from' => $id ), $fname );
		# Fetch through the connection that produced the result, as above
		while( $s = $dbr->fetchObject( $res ) ) {
			$this->addBadLink( $s->bl_to );
		}

		$this->mOldBadLinks = $this->mBadLinks;
		$this->mOldGoodLinks = $this->mGoodLinks;
		$this->mPreFilled = true;

		if ( $wgEnablePersistentLC ) {
			$this->saveToLinkscc( $id );
		}
		wfProfileOut( $fname );
	}

	# Good links present now but absent from the snapshot.
	# array_diff() compares the values, i.e. the article ids.
	function getGoodAdditions() {
		return array_diff( $this->mGoodLinks, $this->mOldGoodLinks );
	}

	# Bad link titles present now but absent from the snapshot, as a plain list.
	function getBadAdditions() {
		#wfDebug( "mOldBadLinks: " . implode( ', ', array_keys( $this->mOldBadLinks ) ) . "\n" );
		#wfDebug( "mBadLinks: " . implode( ', ', array_keys( $this->mBadLinks ) ) . "\n" );
		return array_values( array_diff( array_keys( $this->mBadLinks ), array_keys( $this->mOldBadLinks ) ) );
	}

	# Image links present now but absent from mOldImageLinks. Since nothing
	# in this class fills mOldImageLinks, this is every current image link.
	function getImageAdditions() {
		return array_diff_assoc( $this->mImageLinks, $this->mOldImageLinks );
	}

	# Good links in the snapshot that are no longer present (compared by id).
	function getGoodDeletions() {
		return array_diff( $this->mOldGoodLinks, $this->mGoodLinks );
	}

	# Bad link titles in the snapshot that are no longer present, as a plain list.
	function getBadDeletions() {
		return array_values( array_diff( array_keys( $this->mOldBadLinks ), array_keys( $this->mBadLinks ) ) );
	}

	# Image links in mOldImageLinks that are no longer present.
	function getImageDeletions() {
		return array_diff_assoc( $this->mOldImageLinks, $this->mImageLinks );
	}

	# Parameters: $which is one of the LINKCACHE_xxx constants, $del and $add are
	# the incremental update arrays which will be filled. Returns whether or not it's
	# worth doing the incremental version. For example, if [[List of mathematical topics]]
	# was blanked, it would take a long, long time to do incrementally.
	# Returns false without touching $del/$add when the cache was never
	# pre-filled or when $which is anything other than GOOD or BAD.
	function incrementalSetup( $which, &$del, &$add ) {
		if ( ! $this->mPreFilled ) {
			return false;
		}

		switch ( $which ) {
			case LINKCACHE_GOOD:
				$del = $this->getGoodDeletions();
				$add = $this->getGoodAdditions();
				break;
			case LINKCACHE_BAD:
				$del = $this->getBadDeletions();
				$add = $this->getBadAdditions();
				break;
			default: # LINKCACHE_IMAGE
				return false;
		}

		return true;
	}

	# Clears cache but leaves old preFill copies alone
	function clear() {
		$this->mGoodLinks = array();
		$this->mBadLinks = array();
		$this->mImageLinks = array();
		# Category links are per-page state as well; reset them with the rest
		$this->mCategoryLinks = array();
	}

	# Restore the good/bad link tables for page $id from its linkscc row.
	# Returns true on success. Returns false if there is no row, or if the
	# stored object is unreadable or carries a different $mClassVer.
	/* private */ function fillFromLinkscc( $id ) {
		$fname = 'LinkCache::fillFromLinkscc';
		$id = intval( $id );
		$dbr =& wfGetDB( DB_READ );
		$raw = $dbr->getField( 'linkscc', 'lcc_cacheobj', array( 'lcc_pageid' => $id ), $fname );
		if ( $raw === false ) {
			return false;
		}

		$cacheobj = false;
		if( function_exists( "gzuncompress" ) ) {
			# @: the row may hold uncompressed data, which makes this fail noisily
			$cacheobj = @gzuncompress( $raw );
		}
		if( $cacheobj === false ) {
			# zlib unavailable or data not compressed (saveToLinkscc() writes
			# it uncompressed when compression is off): use the row as-is
			$cacheobj = $raw;
		}

		$cc = @unserialize( $cacheobj );
		if( isset( $cc->mClassVer ) and ( $cc->mClassVer == $this->mClassVer ) ) {
			$this->mOldGoodLinks = $this->mGoodLinks = $cc->mGoodLinks;
			$this->mOldBadLinks = $this->mBadLinks = $cc->mBadLinks;
			$this->mPreFilled = true;
			return TRUE;
		}
		return FALSE;
	}

	# Serialize this object (gz-compressed when $wgCompressedPersistentLC is
	# set and zlib is available) and store it as the linkscc row for page $pid.
	/* private */ function saveToLinkscc( $pid ) {
		global $wgCompressedPersistentLC;
		if( $wgCompressedPersistentLC and function_exists( "gzcompress" ) ) {
			$ser = gzcompress( serialize( $this ), 3 );
		} else {
			$ser = serialize( $this );
		}
		$db =& wfGetDB( DB_WRITE );
		$db->replace( 'linkscc', array( 'lcc_pageid' ), array( 'lcc_pageid' => $pid, 'lcc_cacheobj' => $ser ) );
	}

	# Delete linkscc rows which link to here
	# $pid is a page id
	/* static */ function linksccClearLinksTo( $pid ) {
		global $wgEnablePersistentLC;
		if ( $wgEnablePersistentLC ) {
			$fname = "LinkCache::linksccClearLinksTo";
			$pid = intval( $pid );
			$dbw =& wfGetDB( DB_WRITE );
			# Delete linkscc rows which link to here
			$dbw->deleteJoin( 'linkscc', 'links', 'lcc_pageid', 'l_from', array( 'l_to' => $pid ), $fname );
			# Delete linkscc row representing this page
			$dbw->delete( 'linkscc', array( 'lcc_pageid' => $pid ), $fname );
		}
	}

	# Delete linkscc rows with broken links to here
	# $title is a prefixed db title, for example like Title->getPrefixedDBkey() returns.
	/* static */ function linksccClearBrokenLinksTo( $title ) {
		global $wgEnablePersistentLC;
		$fname = 'LinkCache::linksccClearBrokenLinksTo';

		if ( $wgEnablePersistentLC ) {
			$dbw =& wfGetDB( DB_WRITE );
			$dbw->deleteJoin( 'linkscc', 'brokenlinks', 'lcc_pageid', 'bl_from', array( 'bl_to' => $title ), $fname );
		}
	}

	# Delete the linkscc row representing this page
	# $pid is a page id
	/* static */ function linksccClearPage( $pid ) {
		global $wgEnablePersistentLC;
		if ( $wgEnablePersistentLC ) {
			$fname = 'LinkCache::linksccClearPage';
			$pid = intval( $pid );
			$dbw =& wfGetDB( DB_WRITE );
			$dbw->delete( 'linkscc', array( 'lcc_pageid' => $pid ), $fname );
		}
	}
}
|
2003-04-14 23:10:40 +00:00
|
|
|
?>
|