wiki.techinc.nl/includes/json/JsonCodec.php
C. Scott Ananian e9539efe2c Use JsonCodec to serialize SelserContext
This cleans up a FIXME left over from
I9e6b924d62ccc3312f5c70989477da1e2f21c86b.

SimpleParsoidOutputStashTest was temporary changed from a unit test to
an integration test, since the serialization/deserialization mechanism
for Content relies on ContentHandlerFactory in a way which is
difficult to unit test.  This will be restored in
I0cc1fc1b7403674467d85618b38a3b5a4718b66e once native JSON
serialization for Content is landed.

Follows-Up: I9e6b924d62ccc3312f5c70989477da1e2f21c86b
Change-Id: If985e99f9ca9596d0fe40f0a5ef2cdb72286627d
(cherry picked from commit 2ebf7e12df28f9861bb204ff4134871089a1c771)
2025-09-10 14:08:31 -04:00

366 lines
12 KiB
PHP

<?php
/**
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License along
* with this program; if not, write to the Free Software Foundation, Inc.,
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
* http://www.gnu.org/copyleft/gpl.html
*
* @file
* @ingroup Json
*/
namespace MediaWiki\Json;
use InvalidArgumentException;
use JsonException;
use JsonSerializable;
use Psr\Container\ContainerInterface;
use ReflectionClass;
use stdClass;
use Wikimedia\Assert\Assert;
use Wikimedia\JsonCodec\JsonClassCodec;
use Wikimedia\JsonCodec\JsonCodecable;
use Wikimedia\Parsoid\Core\PageBundle;
/**
* Helper class to serialize/deserialize things to/from JSON.
*
* @stable to type
* @since 1.36
* @package MediaWiki\Json
*/
class JsonCodec
extends \Wikimedia\JsonCodec\JsonCodec
implements JsonDeserializer, JsonSerializer
{
/**
* When true, add extra properties to the serialized output for
* backwards compatibility. This will eventually be made a
* configuration variable and/or removed. (T367584)
*/
private bool $backCompat = true;
/**
* Create a new JsonCodec, with optional access to the provided services.
*/
public function __construct( ?ContainerInterface $services = null ) {
parent::__construct( $services );
// Forward-compatibility with MW 1.44: ensure Parsoid PageBundle is
// codecable
$this->addCodecFor( PageBundle::class, new class implements JsonClassCodec {
/** @inheritDoc */
public function toJsonArray( $obj ): array {
'@phan-var PageBundle $obj'; /** @var PageBundle $obj */
return [
'html' => $obj->html,
'parsoid' => $obj->parsoid,
'mw' => $obj->mw,
'version' => $obj->version,
'headers' => $obj->headers,
'contentmodel' => $obj->contentmodel,
];
}
/** @inheritDoc */
public function newFromJsonArray( string $className, array $json ) {
// @phan-suppress-next-line PhanTypeMismatchReturn
return new PageBundle(
$json['html'] ?? '',
$json['parsoid'] ?? null,
$json['mw'] ?? null,
$json['version'] ?? null,
$json['headers'] ?? null,
$json['contentmodel'] ?? null
);
}
/** @inheritDoc */
public function jsonClassHintFor( string $className, string $keyName ) {
return null;
}
} );
}
/**
* Support the JsonCodecable interface by maintaining a mapping of
* class names to codecs.
* @param class-string $className
* @return ?JsonClassCodec
*/
protected function codecFor( string $className ): ?JsonClassCodec {
static $deserializableCodec = null;
static $serializableCodec = null;
$codec = parent::codecFor( $className );
if ( $codec !== null ) {
return $codec;
}
// Resolve class aliases to ensure we don't use split codecs
$className = ( new ReflectionClass( $className ) )->getName();
// Provide a codec for JsonDeserializable objects
if ( is_a( $className, JsonDeserializable::class, true ) ) {
if ( $deserializableCodec === null ) {
$deserializableCodec = new JsonDeserializableCodec( $this );
}
$codec = $deserializableCodec;
$this->addCodecFor( $className, $codec );
return $codec;
}
// Provide a codec for JsonSerializable objects:
// NOTE this is for compatibility only and does not deserialize!
if ( is_a( $className, JsonSerializable::class, true ) ) {
$codec = JsonSerializableCodec::getInstance();
$this->addCodecFor( $className, $codec );
return $codec;
}
return null;
}
/** @inheritDoc */
protected function markArray( array &$value, string $className, ?string $classHint ): void {
parent::markArray( $value, $className, $classHint );
// Temporarily for backward compatibility add COMPLEX_ANNOTATION as well
if ( $this->backCompat ) {
$value[JsonConstants::COMPLEX_ANNOTATION] = true;
if ( ( $value[JsonConstants::TYPE_ANNOTATION] ?? null ) === 'array' ) {
unset( $value[JsonConstants::TYPE_ANNOTATION] );
}
}
}
/** @inheritDoc */
protected function isArrayMarked( array $value ): bool {
// Temporarily for backward compatibility look for COMPLEX_ANNOTATION as well
if ( $this->backCompat && array_key_exists( JsonConstants::COMPLEX_ANNOTATION, $value ) ) {
return true;
}
if ( ( $value['_type_'] ?? null ) === 'string' ) {
// T313818: see ParserOutput::detectAndEncodeBinary()
return false;
}
return parent::isArrayMarked( $value );
}
/** @inheritDoc */
protected function unmarkArray( array &$value, ?string $classHint ): string {
// Temporarily use the presence of COMPLEX_ANNOTATION as a hint that
// the type is 'array'
if (
$this->backCompat &&
$classHint === null &&
array_key_exists( JsonConstants::COMPLEX_ANNOTATION, $value )
) {
$classHint = 'array';
}
// @phan-suppress-next-line PhanUndeclaredClassReference 'array'
$className = parent::unmarkArray( $value, $classHint );
// Remove the temporarily-added COMPLEX_ANNOTATION
if ( $this->backCompat ) {
unset( $value[JsonConstants::COMPLEX_ANNOTATION] );
}
return $className;
}
/** @deprecated since 1.43; use ::deserialize() */
public function unserialize( $json, ?string $expectedClass = null ) {
return $this->deserialize( $json, $expectedClass );
}
public function deserialize( $json, ?string $expectedClass = null ) {
Assert::parameterType( [ 'stdClass', 'array', 'string' ], $json, '$json' );
Assert::precondition(
!$expectedClass ||
is_subclass_of( $expectedClass, JsonDeserializable::class ) ||
is_subclass_of( $expectedClass, JsonCodecable::class ),
'$expectedClass parameter must be subclass of JsonDeserializable or JsonCodecable, got ' . $expectedClass
);
if ( is_string( $json ) ) {
$jsonStatus = FormatJson::parse( $json, FormatJson::FORCE_ASSOC );
if ( !$jsonStatus->isGood() ) {
throw new JsonException( "Bad JSON: {$jsonStatus}" );
}
$json = $jsonStatus->getValue();
}
if ( $json instanceof stdClass ) {
$json = (array)$json;
}
if ( $expectedClass !== null ) {
// Make copy of $json to avoid unmarking the 'real thing'
$jsonCopy = $json;
if ( is_array( $jsonCopy ) && $this->isArrayMarked( $jsonCopy ) ) {
$got = $this->unmarkArray( $jsonCopy, $expectedClass );
// Compare $got to $expectedClass in a way that works in the
// presence of aliases
if ( is_a( $got, $expectedClass, true ) ) {
// Everything ok!
} else {
throw new JsonException( "Expected {$expectedClass} got {$got}" );
}
} else {
$got = get_debug_type( $json );
throw new JsonException( "Expected {$expectedClass} got {$got}" );
}
}
try {
$result = is_array( $json ) ? $this->newFromJsonArray( $json ) : $json;
} catch ( InvalidArgumentException $e ) {
throw new JsonException( $e->getMessage() );
}
if ( $expectedClass && !is_a( $result, $expectedClass, false ) ) {
throw new JsonException( "Unexpected class: {$expectedClass}" );
}
return $result;
}
/** @deprecated since 1.43; use ::deserializeArray() */
public function unserializeArray( array $array ): array {
return $this->deserializeArray( $array );
}
public function deserializeArray( array $array ): array {
try {
// Pass a class hint here to ensure we recurse into the array.
// @phan-suppress-next-line PhanUndeclaredClassReference 'array'
return $this->newFromJsonArray( $array, 'array' );
} catch ( InvalidArgumentException $e ) {
throw new JsonException( $e->getMessage() );
}
}
public function serialize( $value ) {
// Recursively convert stdClass, JsonSerializable, and JsonCodecable
// to serializable arrays
try {
$value = $this->toJsonArray( $value );
} catch ( InvalidArgumentException $e ) {
throw new JsonException( $e->getMessage() );
}
// Format as JSON
$json = FormatJson::encode( $value, false, FormatJson::ALL_OK );
if ( !$json ) {
try {
// Try to collect more information on the failure.
$details = $this->detectNonSerializableData( $value );
} catch ( \Throwable $t ) {
$details = $t->getMessage();
}
throw new JsonException(
'Failed to encode JSON. ' .
'Error: ' . json_last_error_msg() . '. ' .
'Details: ' . $details
);
}
return $json;
}
// The code below this point is used only for diagnostics; in particular
// for the ::detectNonSerializableData() method which is used to provide
// debugging information in the event of a serialization failure.
/**
* Recursive check for ability to serialize $value to JSON via FormatJson::encode().
*
* @param mixed $value
* @param bool $expectDeserialize
* @param string $accumulatedPath
* @param bool $exhaustive Whether to (slowly) completely traverse the
* $value in order to find the precise location of a problem
* @return string|null JSON path to first encountered non-serializable property or null.
*/
private function detectNonSerializableDataInternal(
$value,
bool $expectDeserialize,
string $accumulatedPath,
bool $exhaustive = false
): ?string {
if (
( is_array( $value ) && $this->isArrayMarked( $value ) ) ||
( $value instanceof stdClass && $this->isArrayMarked( (array)$value ) )
) {
// Contains a conflicting use of JsonConstants::TYPE_ANNOTATION or
// JsonConstants::COMPLEX_ANNOTATION; in the future we might use
// an alternative encoding for these objects to allow them.
return $accumulatedPath . ': conflicting use of protected property';
}
if ( is_object( $value ) ) {
if ( get_class( $value ) === stdClass::class ) {
$value = (array)$value;
} elseif ( $value instanceof JsonCodecable ) {
if ( $exhaustive ) {
// Call the appropriate serialization method and recurse to
// ensure contents are also serializable.
$codec = $this->codecFor( get_class( $value ) );
$value = $codec->toJsonArray( $value );
} else {
// Assume that serializable objects contain 100%
// serializable contents in their representation.
return null;
}
} elseif (
$expectDeserialize ?
$value instanceof JsonDeserializable :
$value instanceof JsonSerializable
) {
if ( $exhaustive ) {
// Call the appropriate serialization method and recurse to
// ensure contents are also serializable.
'@phan-var JsonSerializable $value';
$value = $value->jsonSerialize();
if ( !is_array( $value ) ) {
return $accumulatedPath . ": jsonSerialize didn't return array";
}
} else {
// Assume that serializable objects contain 100%
// serializable contents in their representation.
return null;
}
} else {
// Instances of classes other the \stdClass or JsonSerializable can not be serialized to JSON.
return $accumulatedPath . ': ' . get_debug_type( $value );
}
}
if ( is_array( $value ) ) {
foreach ( $value as $key => $propValue ) {
$propValueNonSerializablePath = $this->detectNonSerializableDataInternal(
$propValue,
$expectDeserialize,
$accumulatedPath . '.' . $key,
$exhaustive
);
if ( $propValueNonSerializablePath !== null ) {
return $propValueNonSerializablePath;
}
}
} elseif ( !is_scalar( $value ) && $value !== null ) {
return $accumulatedPath . ': nonscalar ' . get_debug_type( $value );
}
return null;
}
/**
* Checks if the $value is JSON-serializable (contains only scalar values)
* and returns a JSON-path to the first non-serializable property encountered.
*
* @param mixed $value
* @param bool $expectDeserialize whether to expect the $value to be deserializable with JsonDeserializer.
* @return string|null JSON path to first encountered non-serializable property or null.
* @see JsonDeserializer
* @since 1.36
*/
public function detectNonSerializableData( $value, bool $expectDeserialize = false ): ?string {
return $this->detectNonSerializableDataInternal( $value, $expectDeserialize, '$', true );
}
}