2009-08-11 00:09:24 +00:00
|
|
|
<?php
|
2010-02-24 16:06:55 +00:00
|
|
|
# Copyright © 2009 Aryeh Gregor
|
2009-08-11 00:09:24 +00:00
|
|
|
# http://www.mediawiki.org/
|
|
|
|
|
#
|
|
|
|
|
# This program is free software; you can redistribute it and/or modify
|
|
|
|
|
# it under the terms of the GNU General Public License as published by
|
|
|
|
|
# the Free Software Foundation; either version 2 of the License, or
|
|
|
|
|
# (at your option) any later version.
|
|
|
|
|
#
|
|
|
|
|
# This program is distributed in the hope that it will be useful,
|
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
# GNU General Public License for more details.
|
|
|
|
|
#
|
|
|
|
|
# You should have received a copy of the GNU General Public License along
|
|
|
|
|
# with this program; if not, write to the Free Software Foundation, Inc.,
|
|
|
|
|
# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
|
|
|
|
# http://www.gnu.org/copyleft/gpl.html
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* This class is a collection of static functions that serve two purposes:
|
|
|
|
|
*
|
2009-12-30 07:08:52 +00:00
|
|
|
* 1) Implement any algorithms specified by HTML5, or other HTML
|
2009-08-11 00:09:24 +00:00
|
|
|
* specifications, in a convenient and self-contained way.
|
|
|
|
|
*
|
|
|
|
|
* 2) Allow HTML elements to be conveniently and safely generated, like the
|
|
|
|
|
* current Xml class but a) less confused (Xml supports HTML-specific things,
|
|
|
|
|
* but only sometimes!) and b) not necessarily confined to XML-compatible
|
|
|
|
|
* output.
|
|
|
|
|
*
|
|
|
|
|
* There are two important configuration options this class uses:
|
|
|
|
|
*
|
|
|
|
|
* $wgHtml5: If this is set to false, then all output should be valid XHTML 1.0
|
|
|
|
|
* Transitional.
|
|
|
|
|
* $wgWellFormedXml: If this is set to true, then all output should be
|
|
|
|
|
* well-formed XML (quotes on attributes, self-closing tags, etc.).
|
|
|
|
|
*
|
|
|
|
|
* This class is meant to be confined to utility functions that are called from
|
|
|
|
|
* trusted code paths. It does not do enforcement of policy like not allowing
|
|
|
|
|
* <a> elements.
|
2010-02-24 16:06:55 +00:00
|
|
|
*
|
|
|
|
|
* @since 1.16
|
2009-08-11 00:09:24 +00:00
|
|
|
*/
|
|
|
|
|
class Html {
|
2009-12-30 07:08:52 +00:00
|
|
|
# List of void elements from HTML5, section 9.1.2 as of 2009-08-10
|
2009-08-11 00:09:24 +00:00
|
|
|
private static $voidElements = array(
|
2009-08-19 01:39:05 +00:00
|
|
|
'area',
|
|
|
|
|
'base',
|
|
|
|
|
'br',
|
|
|
|
|
'col',
|
|
|
|
|
'command',
|
|
|
|
|
'embed',
|
|
|
|
|
'hr',
|
|
|
|
|
'img',
|
|
|
|
|
'input',
|
|
|
|
|
'keygen',
|
|
|
|
|
'link',
|
|
|
|
|
'meta',
|
|
|
|
|
'param',
|
|
|
|
|
'source',
|
2009-08-11 00:09:24 +00:00
|
|
|
);
|
|
|
|
|
|
2009-08-11 01:00:44 +00:00
|
|
|
# Boolean attributes, which may have the value omitted entirely. Manually
|
2009-12-30 07:08:52 +00:00
|
|
|
# collected from the HTML5 spec as of 2009-08-10.
|
2009-08-19 01:39:05 +00:00
|
|
|
private static $boolAttribs = array(
|
|
|
|
|
'async',
|
|
|
|
|
'autobuffer',
|
|
|
|
|
'autofocus',
|
|
|
|
|
'autoplay',
|
|
|
|
|
'checked',
|
|
|
|
|
'controls',
|
|
|
|
|
'defer',
|
|
|
|
|
'disabled',
|
|
|
|
|
'formnovalidate',
|
|
|
|
|
'hidden',
|
|
|
|
|
'ismap',
|
|
|
|
|
'loop',
|
|
|
|
|
'multiple',
|
|
|
|
|
'novalidate',
|
|
|
|
|
'open',
|
|
|
|
|
'readonly',
|
|
|
|
|
'required',
|
|
|
|
|
'reversed',
|
|
|
|
|
'scoped',
|
|
|
|
|
'seamless',
|
2009-08-11 01:00:44 +00:00
|
|
|
);
|
|
|
|
|
|
2009-08-11 00:09:24 +00:00
|
|
|
/**
|
|
|
|
|
* Returns an HTML element in a string. The major advantage here over
|
|
|
|
|
* manually typing out the HTML is that it will escape all attribute
|
|
|
|
|
* values. If you're hardcoding all the attributes, or there are none, you
|
|
|
|
|
* should probably type out the string yourself.
|
|
|
|
|
*
|
2009-08-21 20:39:16 +00:00
|
|
|
* This is quite similar to Xml::tags(), but it implements some useful
|
2009-08-11 00:09:24 +00:00
|
|
|
* HTML-specific logic. For instance, there is no $allowShortTag
|
|
|
|
|
* parameter: the closing tag is magically omitted if $element has an empty
|
|
|
|
|
* content model. If $wgWellFormedXml is false, then a few bytes will be
|
|
|
|
|
* shaved off the HTML output as well. In the future, other HTML-specific
|
|
|
|
|
* features might be added, like allowing arrays for the values of
|
|
|
|
|
* attributes like class= and media=.
|
|
|
|
|
*
|
|
|
|
|
* @param $element string The element's name, e.g., 'a'
|
|
|
|
|
* @param $attribs array Associative array of attributes, e.g., array(
|
2009-09-23 15:16:05 +00:00
|
|
|
* 'href' => 'http://www.mediawiki.org/' ). See expandAttributes() for
|
|
|
|
|
* further documentation.
|
2009-08-11 00:09:24 +00:00
|
|
|
* @param $contents string The raw HTML contents of the element: *not*
|
|
|
|
|
* escaped!
|
|
|
|
|
* @return string Raw HTML
|
|
|
|
|
*/
|
2009-08-18 01:01:47 +00:00
|
|
|
public static function rawElement( $element, $attribs = array(), $contents = '' ) {
|
2010-01-15 01:16:52 +00:00
|
|
|
global $wgWellFormedXml;
|
|
|
|
|
$start = self::openElement( $element, $attribs );
|
|
|
|
|
if ( in_array( $element, self::$voidElements ) ) {
|
|
|
|
|
if ( $wgWellFormedXml ) {
|
|
|
|
|
# Silly XML.
|
|
|
|
|
return substr( $start, 0, -1 ) . ' />';
|
|
|
|
|
}
|
|
|
|
|
return $start;
|
|
|
|
|
} else {
|
2010-03-21 05:12:02 +00:00
|
|
|
return "$start$contents" . self::closeElement( $element );
|
2010-01-15 01:16:52 +00:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Identical to rawElement(), but HTML-escapes $contents (like
|
|
|
|
|
* Xml::element()).
|
|
|
|
|
*/
|
|
|
|
|
public static function element( $element, $attribs = array(), $contents = '' ) {
|
|
|
|
|
return self::rawElement( $element, $attribs, strtr( $contents, array(
|
|
|
|
|
# There's no point in escaping quotes, >, etc. in the contents of
|
|
|
|
|
# elements.
|
|
|
|
|
'&' => '&',
|
|
|
|
|
'<' => '<'
|
|
|
|
|
) ) );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Identical to rawElement(), but has no third parameter and omits the end
|
2010-03-21 05:12:02 +00:00
|
|
|
* tag (and the self-closing '/' in XML mode for empty elements).
|
2010-01-15 01:16:52 +00:00
|
|
|
*/
|
|
|
|
|
public static function openElement( $element, $attribs = array() ) {
|
2010-03-21 05:12:02 +00:00
|
|
|
global $wgHtml5, $wgWellFormedXml;
|
2009-09-22 17:41:34 +00:00
|
|
|
$attribs = (array)$attribs;
|
2009-12-30 07:08:52 +00:00
|
|
|
# This is not required in HTML5, but let's do it anyway, for
|
2009-08-21 20:50:35 +00:00
|
|
|
# consistency and better compression.
|
2009-08-11 00:09:24 +00:00
|
|
|
$element = strtolower( $element );
|
2009-08-21 20:50:35 +00:00
|
|
|
|
2010-03-21 05:12:02 +00:00
|
|
|
# In text/html, initial <html> and <head> tags can be omitted under
|
|
|
|
|
# pretty much any sane circumstances, if they have no attributes. See:
|
|
|
|
|
# <http://www.whatwg.org/specs/web-apps/current-work/multipage/syntax.html#optional-tags>
|
|
|
|
|
if ( !$wgWellFormedXml && !$attribs
|
|
|
|
|
&& in_array( $element, array( 'html', 'head' ) ) ) {
|
|
|
|
|
return '';
|
|
|
|
|
}
|
|
|
|
|
|
Fix bugs in r59360, r59361, r59363
* spellcheck is not a boolean attribute; it is an enumerated attribute
whose possible values are "true" and "false". If it were boolean, the
permitted constructs would be <input spellcheck>, <input
spellcheck="spellcheck">, and <input spellcheck="">, which would all
set it true, and it would only be set to false if omitted entirely.
(It would be boolean if HTML5 had invented it, but can't be for
historical reasons.)
* spellcheck is valid on any HTML element, not just input, and so should
be stripped on any element.
For reference, a table of all HTML5 attributes can be found at:
<http://www.whatwg.org/specs/web-apps/current-work/multipage/section-index.html#attributes-0>
2009-12-11 19:01:16 +00:00
|
|
|
# Remove HTML5-only attributes if we aren't doing HTML5
|
|
|
|
|
if ( !$wgHtml5 ) {
|
|
|
|
|
if ( $element == 'input' ) {
|
|
|
|
|
# Whitelist of valid XHTML1 types
|
2009-08-21 20:50:35 +00:00
|
|
|
$validTypes = array(
|
|
|
|
|
'hidden',
|
|
|
|
|
'text',
|
|
|
|
|
'password',
|
|
|
|
|
'checkbox',
|
|
|
|
|
'radio',
|
|
|
|
|
'file',
|
|
|
|
|
'submit',
|
|
|
|
|
'image',
|
|
|
|
|
'reset',
|
|
|
|
|
'button',
|
|
|
|
|
);
|
|
|
|
|
if ( isset( $attribs['type'] )
|
|
|
|
|
&& !in_array( $attribs['type'], $validTypes ) ) {
|
|
|
|
|
# Fall back to type=text, the default
|
|
|
|
|
unset( $attribs['type'] );
|
|
|
|
|
}
|
Fix bugs in r59360, r59361, r59363
* spellcheck is not a boolean attribute; it is an enumerated attribute
whose possible values are "true" and "false". If it were boolean, the
permitted constructs would be <input spellcheck>, <input
spellcheck="spellcheck">, and <input spellcheck="">, which would all
set it true, and it would only be set to false if omitted entirely.
(It would be boolean if HTML5 had invented it, but can't be for
historical reasons.)
* spellcheck is valid on any HTML element, not just input, and so should
be stripped on any element.
For reference, a table of all HTML5 attributes can be found at:
<http://www.whatwg.org/specs/web-apps/current-work/multipage/section-index.html#attributes-0>
2009-12-11 19:01:16 +00:00
|
|
|
}
|
2009-12-15 00:11:47 +00:00
|
|
|
if ( $element == 'textarea' && isset( $attribs['maxlength'] ) ) {
|
|
|
|
|
unset( $attribs['maxlength'] );
|
|
|
|
|
}
|
Fix bugs in r59360, r59361, r59363
* spellcheck is not a boolean attribute; it is an enumerated attribute
whose possible values are "true" and "false". If it were boolean, the
permitted constructs would be <input spellcheck>, <input
spellcheck="spellcheck">, and <input spellcheck="">, which would all
set it true, and it would only be set to false if omitted entirely.
(It would be boolean if HTML5 had invented it, but can't be for
historical reasons.)
* spellcheck is valid on any HTML element, not just input, and so should
be stripped on any element.
For reference, a table of all HTML5 attributes can be found at:
<http://www.whatwg.org/specs/web-apps/current-work/multipage/section-index.html#attributes-0>
2009-12-11 19:01:16 +00:00
|
|
|
# Here we're blacklisting some HTML5-only attributes...
|
|
|
|
|
$html5attribs = array(
|
|
|
|
|
'autocomplete',
|
|
|
|
|
'autofocus',
|
|
|
|
|
'max',
|
|
|
|
|
'min',
|
|
|
|
|
'multiple',
|
|
|
|
|
'pattern',
|
|
|
|
|
'placeholder',
|
|
|
|
|
'required',
|
|
|
|
|
'step',
|
|
|
|
|
'spellcheck',
|
|
|
|
|
);
|
|
|
|
|
foreach ( $html5attribs as $badAttr ) {
|
|
|
|
|
unset( $attribs[$badAttr] );
|
2009-08-21 20:50:35 +00:00
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2010-01-15 01:16:52 +00:00
|
|
|
return "<$element" . self::expandAttributes(
|
|
|
|
|
self::dropDefaults( $element, $attribs ) ) . '>';
|
2009-08-18 01:01:47 +00:00
|
|
|
}
|
|
|
|
|
|
2010-03-21 05:12:02 +00:00
|
|
|
/**
|
|
|
|
|
* Returns "</$element>", except if $wgWellFormedXml is off, in which case
|
|
|
|
|
* it returns the empty string when that's guaranteed to be safe.
|
|
|
|
|
*
|
|
|
|
|
* @param $element string Name of the element, e.g., 'a'
|
|
|
|
|
* @return string A closing tag, if required
|
|
|
|
|
*/
|
|
|
|
|
public static function closeElement( $element ) {
|
|
|
|
|
global $wgWellFormedXml;
|
|
|
|
|
|
|
|
|
|
$element = strtolower( $element );
|
|
|
|
|
|
|
|
|
|
# Reference:
|
|
|
|
|
# http://www.whatwg.org/specs/web-apps/current-work/multipage/syntax.html#optional-tags
|
|
|
|
|
if ( !$wgWellFormedXml && in_array( $element, array(
|
|
|
|
|
'html',
|
|
|
|
|
'head',
|
|
|
|
|
'body',
|
|
|
|
|
'li',
|
|
|
|
|
'dt',
|
|
|
|
|
'dd',
|
|
|
|
|
'tr',
|
|
|
|
|
'td',
|
|
|
|
|
'th',
|
|
|
|
|
) ) ) {
|
|
|
|
|
return '';
|
|
|
|
|
}
|
|
|
|
|
return "</$element>";
|
|
|
|
|
}
|
|
|
|
|
|
2009-09-07 00:21:55 +00:00
|
|
|
/**
|
|
|
|
|
* Given an element name and an associative array of element attributes,
|
|
|
|
|
* return an array that is functionally identical to the input array, but
|
|
|
|
|
* possibly smaller. In particular, attributes might be stripped if they
|
|
|
|
|
* are given their default values.
|
|
|
|
|
*
|
|
|
|
|
* This method is not guaranteed to remove all redundant attributes, only
|
|
|
|
|
* some common ones and some others selected arbitrarily at random. It
|
|
|
|
|
* only guarantees that the output array should be functionally identical
|
|
|
|
|
* to the input array (currently per the HTML 5 draft as of 2009-09-06).
|
|
|
|
|
*
|
|
|
|
|
* @param $element string Name of the element, e.g., 'a'
|
|
|
|
|
* @param $attribs array Associative array of attributes, e.g., array(
|
2009-09-23 15:16:05 +00:00
|
|
|
* 'href' => 'http://www.mediawiki.org/' ). See expandAttributes() for
|
|
|
|
|
* further documentation.
|
2009-09-07 00:21:55 +00:00
|
|
|
* @return array An array of attributes functionally identical to $attribs
|
|
|
|
|
*/
|
|
|
|
|
private static function dropDefaults( $element, $attribs ) {
|
2009-09-18 14:19:34 +00:00
|
|
|
# Don't bother doing anything if we aren't outputting HTML5; it's too
|
|
|
|
|
# much of a pain to maintain two sets of defaults.
|
|
|
|
|
global $wgHtml5;
|
|
|
|
|
if ( !$wgHtml5 ) {
|
|
|
|
|
return $attribs;
|
|
|
|
|
}
|
|
|
|
|
|
2009-09-07 00:21:55 +00:00
|
|
|
static $attribDefaults = array(
|
|
|
|
|
'area' => array( 'shape' => 'rect' ),
|
|
|
|
|
'button' => array(
|
|
|
|
|
'formaction' => 'GET',
|
|
|
|
|
'formenctype' => 'application/x-www-form-urlencoded',
|
|
|
|
|
'type' => 'submit',
|
|
|
|
|
),
|
|
|
|
|
'canvas' => array(
|
|
|
|
|
'height' => '150',
|
|
|
|
|
'width' => '300',
|
|
|
|
|
),
|
|
|
|
|
'command' => array( 'type' => 'command' ),
|
|
|
|
|
'form' => array(
|
|
|
|
|
'action' => 'GET',
|
|
|
|
|
'autocomplete' => 'on',
|
|
|
|
|
'enctype' => 'application/x-www-form-urlencoded',
|
|
|
|
|
),
|
|
|
|
|
'input' => array(
|
|
|
|
|
'formaction' => 'GET',
|
|
|
|
|
'type' => 'text',
|
|
|
|
|
'value' => '',
|
|
|
|
|
),
|
|
|
|
|
'keygen' => array( 'keytype' => 'rsa' ),
|
|
|
|
|
'link' => array( 'media' => 'all' ),
|
|
|
|
|
'menu' => array( 'type' => 'list' ),
|
|
|
|
|
# Note: the use of text/javascript here instead of other JavaScript
|
2009-12-30 07:08:52 +00:00
|
|
|
# MIME types follows the HTML5 spec.
|
2009-09-07 00:21:55 +00:00
|
|
|
'script' => array( 'type' => 'text/javascript' ),
|
|
|
|
|
'style' => array(
|
|
|
|
|
'media' => 'all',
|
|
|
|
|
'type' => 'text/css',
|
|
|
|
|
),
|
|
|
|
|
'textarea' => array( 'wrap' => 'soft' ),
|
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
$element = strtolower( $element );
|
|
|
|
|
|
|
|
|
|
foreach ( $attribs as $attrib => $value ) {
|
|
|
|
|
$lcattrib = strtolower( $attrib );
|
2009-09-07 15:25:22 +00:00
|
|
|
$value = strval( $value );
|
2009-09-07 00:21:55 +00:00
|
|
|
|
2009-09-07 15:25:22 +00:00
|
|
|
# Simple checks using $attribDefaults
|
2009-09-07 00:21:55 +00:00
|
|
|
if ( isset( $attribDefaults[$element][$lcattrib] ) &&
|
2009-09-07 15:25:22 +00:00
|
|
|
$attribDefaults[$element][$lcattrib] == $value ) {
|
|
|
|
|
unset( $attribs[$attrib] );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( $lcattrib == 'class' && $value == '' ) {
|
2009-09-07 00:21:55 +00:00
|
|
|
unset( $attribs[$attrib] );
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
# More subtle checks
|
|
|
|
|
if ( $element === 'link' && isset( $attribs['type'] )
|
2009-09-07 15:25:22 +00:00
|
|
|
&& strval( $attribs['type'] ) == 'text/css' ) {
|
2009-09-07 00:21:55 +00:00
|
|
|
unset( $attribs['type'] );
|
|
|
|
|
}
|
|
|
|
|
if ( $element === 'select' && isset( $attribs['size'] ) ) {
|
|
|
|
|
if ( in_array( 'multiple', $attribs )
|
|
|
|
|
|| ( isset( $attribs['multiple'] ) && $attribs['multiple'] !== false )
|
|
|
|
|
) {
|
|
|
|
|
# A multi-select
|
2009-09-07 15:25:22 +00:00
|
|
|
if ( strval( $attribs['size'] ) == '4' ) {
|
2009-09-07 00:21:55 +00:00
|
|
|
unset( $attribs['size'] );
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
# Single select
|
2009-09-07 15:25:22 +00:00
|
|
|
if ( strval( $attribs['size'] ) == '1' ) {
|
2009-09-07 00:21:55 +00:00
|
|
|
unset( $attribs['size'] );
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $attribs;
|
|
|
|
|
}
|
|
|
|
|
|
2009-08-11 00:09:24 +00:00
|
|
|
/**
|
|
|
|
|
* Given an associative array of element attributes, generate a string
|
|
|
|
|
* to stick after the element name in HTML output. Like array( 'href' =>
|
|
|
|
|
* 'http://www.mediawiki.org/' ) becomes something like
|
|
|
|
|
* ' href="http://www.mediawiki.org"'. Again, this is like
|
|
|
|
|
* Xml::expandAttributes(), but it implements some HTML-specific logic.
|
2009-08-11 01:00:44 +00:00
|
|
|
* For instance, it will omit quotation marks if $wgWellFormedXml is false,
|
|
|
|
|
* and will treat boolean attributes specially.
|
2009-08-11 00:09:24 +00:00
|
|
|
*
|
|
|
|
|
* @param $attribs array Associative array of attributes, e.g., array(
|
|
|
|
|
* 'href' => 'http://www.mediawiki.org/' ). Values will be HTML-escaped.
|
2009-09-23 15:16:05 +00:00
|
|
|
* A value of false means to omit the attribute. For boolean attributes,
|
|
|
|
|
* you can omit the key, e.g., array( 'checked' ) instead of
|
|
|
|
|
* array( 'checked' => 'checked' ) or such.
|
2009-08-11 00:09:24 +00:00
|
|
|
* @return string HTML fragment that goes between element name and '>'
|
|
|
|
|
* (starting with a space if at least one attribute is output)
|
|
|
|
|
*/
|
2009-09-18 14:55:42 +00:00
|
|
|
public static function expandAttributes( $attribs ) {
|
2009-08-11 01:00:44 +00:00
|
|
|
global $wgHtml5, $wgWellFormedXml;
|
2009-08-11 00:09:24 +00:00
|
|
|
|
|
|
|
|
$ret = '';
|
2009-09-18 14:55:42 +00:00
|
|
|
$attribs = (array)$attribs;
|
2009-08-11 00:09:24 +00:00
|
|
|
foreach ( $attribs as $key => $value ) {
|
2009-08-26 14:59:59 +00:00
|
|
|
if ( $value === false ) {
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
|
2009-08-21 21:06:06 +00:00
|
|
|
# For boolean attributes, support array( 'foo' ) instead of
|
|
|
|
|
# requiring array( 'foo' => 'meaningless' ).
|
|
|
|
|
if ( is_int( $key )
|
|
|
|
|
&& in_array( strtolower( $value ), self::$boolAttribs ) ) {
|
|
|
|
|
$key = $value;
|
|
|
|
|
}
|
|
|
|
|
|
2009-12-30 07:08:52 +00:00
|
|
|
# Not technically required in HTML5, but required in XHTML 1.0,
|
2009-08-21 21:06:06 +00:00
|
|
|
# and we'd like consistency and better compression anyway.
|
|
|
|
|
$key = strtolower( $key );
|
|
|
|
|
|
2009-12-30 07:08:52 +00:00
|
|
|
# See the "Attributes" section in the HTML syntax part of HTML5,
|
2009-08-11 00:09:24 +00:00
|
|
|
# 9.1.2.3 as of 2009-08-10. Most attributes can have quotation
|
|
|
|
|
# marks omitted, but not all. (Although a literal " is not
|
|
|
|
|
# permitted, we don't check for that, since it will be escaped
|
|
|
|
|
# anyway.)
|
2009-09-18 15:28:46 +00:00
|
|
|
#
|
|
|
|
|
# See also research done on further characters that need to be
|
|
|
|
|
# escaped: http://code.google.com/p/html5lib/issues/detail?id=93
|
|
|
|
|
$badChars = "\\x00- '=<>`/\x{00a0}\x{1680}\x{180e}\x{180F}\x{2000}\x{2001}"
|
|
|
|
|
. "\x{2002}\x{2003}\x{2004}\x{2005}\x{2006}\x{2007}\x{2008}\x{2009}"
|
|
|
|
|
. "\x{200A}\x{2028}\x{2029}\x{202F}\x{205F}\x{3000}";
|
2009-09-06 15:08:10 +00:00
|
|
|
if ( $wgWellFormedXml || $value === ''
|
2009-09-18 15:28:46 +00:00
|
|
|
|| preg_match( "![$badChars]!u", $value ) ) {
|
2009-08-11 00:09:24 +00:00
|
|
|
$quote = '"';
|
|
|
|
|
} else {
|
|
|
|
|
$quote = '';
|
|
|
|
|
}
|
|
|
|
|
|
2009-08-11 01:00:44 +00:00
|
|
|
if ( in_array( $key, self::$boolAttribs ) ) {
|
|
|
|
|
# In XHTML 1.0 Transitional, the value needs to be equal to the
|
2009-12-30 07:08:52 +00:00
|
|
|
# key. In HTML5, we can leave the value empty instead. If we
|
2009-08-11 01:00:44 +00:00
|
|
|
# don't need well-formed XML, we can omit the = entirely.
|
|
|
|
|
if ( !$wgWellFormedXml ) {
|
|
|
|
|
$ret .= " $key";
|
|
|
|
|
} elseif ( $wgHtml5 ) {
|
|
|
|
|
$ret .= " $key=\"\"";
|
|
|
|
|
} else {
|
|
|
|
|
$ret .= " $key=\"$key\"";
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
# Apparently we need to entity-encode \n, \r, \t, although the
|
|
|
|
|
# spec doesn't mention that. Since we're doing strtr() anyway,
|
|
|
|
|
# and we don't need <> escaped here, we may as well not call
|
|
|
|
|
# htmlspecialchars(). FIXME: verify that we actually need to
|
|
|
|
|
# escape \n\r\t here, and explain why, exactly.
|
2009-10-01 01:30:58 +00:00
|
|
|
#
|
|
|
|
|
# We could call Sanitizer::encodeAttribute() for this, but we
|
|
|
|
|
# don't because we're stubborn and like our marginal savings on
|
|
|
|
|
# byte size from not having to encode unnecessary quotes.
|
|
|
|
|
$map = array(
|
|
|
|
|
'&' => '&',
|
|
|
|
|
'"' => '"',
|
|
|
|
|
"\n" => ' ',
|
|
|
|
|
"\r" => ' ',
|
|
|
|
|
"\t" => '	'
|
|
|
|
|
);
|
|
|
|
|
if ( $wgWellFormedXml ) {
|
2010-02-21 01:44:25 +00:00
|
|
|
# This is allowed per spec: <http://www.w3.org/TR/xml/#NT-AttValue>
|
|
|
|
|
# But reportedly it breaks some XML tools? FIXME: is this
|
|
|
|
|
# really true?
|
2009-10-01 01:30:58 +00:00
|
|
|
$map['<'] = '<';
|
2009-09-16 05:29:44 +00:00
|
|
|
}
|
2009-10-01 01:30:58 +00:00
|
|
|
$ret .= " $key=$quote" . strtr( $value, $map ) . $quote;
|
2009-08-11 01:00:44 +00:00
|
|
|
}
|
2009-08-11 00:09:24 +00:00
|
|
|
}
|
|
|
|
|
return $ret;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Output a <script> tag with the given contents. TODO: do some useful
|
|
|
|
|
* escaping as well, like if $contents contains literal '</script>' or (for
|
|
|
|
|
* XML) literal "]]>".
|
|
|
|
|
*
|
|
|
|
|
* @param $contents string JavaScript
|
|
|
|
|
* @return string Raw HTML
|
|
|
|
|
*/
|
|
|
|
|
public static function inlineScript( $contents ) {
|
2009-08-23 21:06:54 +00:00
|
|
|
global $wgHtml5, $wgJsMimeType, $wgWellFormedXml;
|
2009-08-11 00:09:24 +00:00
|
|
|
|
|
|
|
|
$attrs = array();
|
|
|
|
|
if ( !$wgHtml5 ) {
|
|
|
|
|
$attrs['type'] = $wgJsMimeType;
|
2009-08-23 21:06:54 +00:00
|
|
|
}
|
|
|
|
|
if ( $wgWellFormedXml && preg_match( '/[<&]/', $contents ) ) {
|
2009-08-11 00:09:24 +00:00
|
|
|
$contents = "/*<![CDATA[*/$contents/*]]>*/";
|
|
|
|
|
}
|
2009-08-18 01:01:47 +00:00
|
|
|
return self::rawElement( 'script', $attrs, $contents );
|
2009-08-11 00:09:24 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Output a <script> tag linking to the given URL, e.g.,
|
|
|
|
|
* <script src=foo.js></script>.
|
|
|
|
|
*
|
|
|
|
|
* @param $url string
|
|
|
|
|
* @return string Raw HTML
|
|
|
|
|
*/
|
|
|
|
|
public static function linkedScript( $url ) {
|
|
|
|
|
global $wgHtml5, $wgJsMimeType;
|
|
|
|
|
|
|
|
|
|
$attrs = array( 'src' => $url );
|
|
|
|
|
if ( !$wgHtml5 ) {
|
|
|
|
|
$attrs['type'] = $wgJsMimeType;
|
|
|
|
|
}
|
|
|
|
|
return self::element( 'script', $attrs );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Output a <style> tag with the given contents for the given media type
|
|
|
|
|
* (if any). TODO: do some useful escaping as well, like if $contents
|
|
|
|
|
* contains literal '</style>' (admittedly unlikely).
|
|
|
|
|
*
|
|
|
|
|
* @param $contents string CSS
|
2009-09-07 00:21:55 +00:00
|
|
|
* @param $media mixed A media type string, like 'screen'
|
2009-08-11 00:09:24 +00:00
|
|
|
* @return string Raw HTML
|
|
|
|
|
*/
|
2009-09-07 00:21:55 +00:00
|
|
|
public static function inlineStyle( $contents, $media = 'all' ) {
|
|
|
|
|
global $wgWellFormedXml;
|
2009-08-11 00:09:24 +00:00
|
|
|
|
2009-08-23 21:06:54 +00:00
|
|
|
if ( $wgWellFormedXml && preg_match( '/[<&]/', $contents ) ) {
|
|
|
|
|
$contents = "/*<![CDATA[*/$contents/*]]>*/";
|
|
|
|
|
}
|
2009-09-07 00:21:55 +00:00
|
|
|
return self::rawElement( 'style', array(
|
|
|
|
|
'type' => 'text/css',
|
|
|
|
|
'media' => $media,
|
|
|
|
|
), $contents );
|
2009-08-11 00:09:24 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Output a <link rel=stylesheet> linking to the given URL for the given
|
|
|
|
|
* media type (if any).
|
|
|
|
|
*
|
|
|
|
|
* @param $url string
|
2009-09-07 00:21:55 +00:00
|
|
|
* @param $media mixed A media type string, like 'screen'
|
2009-08-11 00:09:24 +00:00
|
|
|
* @return string Raw HTML
|
|
|
|
|
*/
|
2009-09-07 00:21:55 +00:00
|
|
|
public static function linkedStyle( $url, $media = 'all' ) {
|
|
|
|
|
return self::element( 'link', array(
|
|
|
|
|
'rel' => 'stylesheet',
|
|
|
|
|
'href' => $url,
|
|
|
|
|
'type' => 'text/css',
|
|
|
|
|
'media' => $media,
|
|
|
|
|
) );
|
2009-08-11 00:09:24 +00:00
|
|
|
}
|
2009-08-11 01:00:44 +00:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Convenience function to produce an <input> element. This supports the
|
2009-12-30 07:08:52 +00:00
|
|
|
* new HTML5 input types and attributes, and will silently strip them if
|
2009-08-11 01:00:44 +00:00
|
|
|
* $wgHtml5 is false.
|
|
|
|
|
*
|
|
|
|
|
* @param $name string name attribute
|
2009-09-07 00:21:55 +00:00
|
|
|
* @param $value mixed value attribute
|
2009-08-11 01:00:44 +00:00
|
|
|
* @param $type string type attribute
|
2009-08-21 22:30:51 +00:00
|
|
|
* @param $attribs array Associative array of miscellaneous extra
|
|
|
|
|
* attributes, passed to Html::element()
|
2009-08-11 01:00:44 +00:00
|
|
|
* @return string Raw HTML
|
|
|
|
|
*/
|
2009-09-07 00:21:55 +00:00
|
|
|
public static function input( $name, $value = '', $type = 'text', $attribs = array() ) {
|
2009-09-06 15:07:52 +00:00
|
|
|
$attribs['type'] = $type;
|
2009-09-07 00:21:55 +00:00
|
|
|
$attribs['value'] = $value;
|
2009-08-11 01:00:44 +00:00
|
|
|
$attribs['name'] = $name;
|
|
|
|
|
|
|
|
|
|
return self::element( 'input', $attribs );
|
|
|
|
|
}
|
2009-08-21 21:57:26 +00:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Convenience function to produce an input element with type=hidden, like
|
|
|
|
|
* Xml::hidden.
|
|
|
|
|
*
|
|
|
|
|
* @param $name string name attribute
|
|
|
|
|
* @param $value string value attribute
|
|
|
|
|
* @param $attribs array Associative array of miscellaneous extra
|
|
|
|
|
* attributes, passed to Html::element()
|
|
|
|
|
* @return string Raw HTML
|
|
|
|
|
*/
|
|
|
|
|
public static function hidden( $name, $value, $attribs = array() ) {
|
|
|
|
|
return self::input( $name, $value, 'hidden', $attribs );
|
|
|
|
|
}
|
2009-12-02 07:22:29 +00:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Convenience function to produce an <input> element. This supports leaving
|
|
|
|
|
* out the cols= and rows= which Xml requires and are required by HTML4/XHTML
|
|
|
|
|
* but not required by HTML5 and will silently set cols="" and rows="" if
|
|
|
|
|
* $wgHtml5 is false and cols and rows are omitted (HTML4 validates present
|
|
|
|
|
* but empty cols="" and rows="" as valid).
|
|
|
|
|
*
|
|
|
|
|
* @param $name string name attribute
|
|
|
|
|
* @param $value string value attribute
|
|
|
|
|
* @param $attribs array Associative array of miscellaneous extra
|
|
|
|
|
* attributes, passed to Html::element()
|
|
|
|
|
* @return string Raw HTML
|
|
|
|
|
*/
|
|
|
|
|
public static function textarea( $name, $value = '', $attribs = array() ) {
|
|
|
|
|
global $wgHtml5;
|
|
|
|
|
$attribs['name'] = $name;
|
|
|
|
|
if ( !$wgHtml5 ) {
|
2010-01-27 19:14:18 +00:00
|
|
|
if ( !isset( $attribs['cols'] ) )
|
2009-12-02 07:22:29 +00:00
|
|
|
$attribs['cols'] = "";
|
2010-01-27 19:14:18 +00:00
|
|
|
if ( !isset( $attribs['rows'] ) )
|
2009-12-02 07:22:29 +00:00
|
|
|
$attribs['rows'] = "";
|
|
|
|
|
}
|
|
|
|
|
return self::element( 'textarea', $attribs, $value );
|
|
|
|
|
}
|
2010-05-08 13:45:14 +00:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Constructs the opening html-tag with necessary doctypes depending on
|
|
|
|
|
* global variables.
|
|
|
|
|
*
|
|
|
|
|
* @param $attribs array Associative array of miscellaneous extra
|
|
|
|
|
* attributes, passed to Html::element() of html tag.
|
|
|
|
|
* @return string Raw HTML
|
|
|
|
|
*/
|
|
|
|
|
public static function htmlHeader( $attribs = array() ) {
|
|
|
|
|
$ret = '';
|
|
|
|
|
|
|
|
|
|
global $wgMimeType, $wgOutputEncoding;
|
|
|
|
|
if ( self::isXmlMimeType( $wgMimeType ) ) {
|
|
|
|
|
$ret .= "<?xml version=\"1.0\" encoding=\"$wgOutputEncoding\" ?" . ">\n";
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
global $wgHtml5, $wgHtml5Version, $wgWellFormedXml, $wgDocType, $wgDTD;
|
|
|
|
|
global $wgXhtmlNamespaces, $wgXhtmlDefaultNamespace;
|
|
|
|
|
if ( $wgHtml5 ) {
|
|
|
|
|
if ( $wgWellFormedXml ) {
|
|
|
|
|
# Unknown elements and attributes are okay in XML, but unknown
|
|
|
|
|
# named entities are well-formedness errors and will break XML
|
|
|
|
|
# parsers. Thus we need a doctype that gives us appropriate
|
|
|
|
|
# entity definitions. The HTML5 spec permits four legacy
|
|
|
|
|
# doctypes as obsolete but conforming, so let's pick one of
|
|
|
|
|
# those, although it makes our pages look like XHTML1 Strict.
|
|
|
|
|
# Isn't compatibility great?
|
|
|
|
|
$ret .= "<!DOCTYPE html PUBLIC \"-//W3C//DTD XHTML 1.0 Strict//EN\" \"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd\">\n";
|
|
|
|
|
} else {
|
|
|
|
|
# Much saner.
|
|
|
|
|
$ret .= "<!doctype html>\n";
|
|
|
|
|
}
|
|
|
|
|
if ( $wgHtml5Version ) {
|
|
|
|
|
$attribs['version'] = $wgHtml5Version;
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
$ret .= "<!DOCTYPE html PUBLIC \"$wgDocType\" \"$wgDTD\">\n";
|
|
|
|
|
$attribs['xmlns'] = $wgXhtmlDefaultNamespace;
|
|
|
|
|
foreach ( $wgXhtmlNamespaces as $tag => $ns ) {
|
|
|
|
|
$attribs["xmlns:$tag"] = $ns;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return $ret . Html::openElement( 'html', $attribs ) . "\n";
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Determines if the given mime type is xml.
|
|
|
|
|
*
|
|
|
|
|
* @param $mimetype string MimeType
|
|
|
|
|
* @return Boolean
|
|
|
|
|
*/
|
|
|
|
|
public static function isXmlMimeType( $mimetype ) {
|
|
|
|
|
switch ( $mimetype ) {
|
|
|
|
|
case 'text/xml':
|
|
|
|
|
case 'application/xhtml+xml':
|
|
|
|
|
case 'application/xml':
|
|
|
|
|
return true;
|
|
|
|
|
default:
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
}
|
2009-08-11 00:09:24 +00:00
|
|
|
}
|