2007-07-19 10:40:28 +00:00
|
|
|
<?php
|
|
|
|
/**
|
2015-11-14 11:44:49 +13:00
|
|
|
* The content negotiator performs "text/html" or "application/xhtml+xml" switching. It does this through
|
|
|
|
* the public static function ContentNegotiator::process(). By default, ContentNegotiator will comply with
|
|
|
|
* the Accept headers the client sends along with the HTTP request, which is most likely
|
|
|
|
* "application/xhtml+xml" (see "Order of selection" below).
|
2008-09-16 14:29:00 +00:00
|
|
|
*
|
|
|
|
* Order of selection between html or xhtml is as follows:
|
2015-11-14 11:44:49 +13:00
|
|
|
* - if PHP has already sent the HTTP headers, default to "html" (we can't send HTTP Content-Type headers
|
|
|
|
* any longer)
|
2008-09-16 14:29:00 +00:00
|
|
|
* - if a GET variable ?forceFormat is set, it takes precedence (for testing purposes)
|
|
|
|
* - if the user agent is detected as W3C Validator we always deliver "xhtml"
|
|
|
|
* - if an HTTP Accept header is sent from the client, we respect its order (this is the most common case)
|
|
|
|
* - if none of the above matches, fallback is "html"
|
2014-08-15 18:53:05 +12:00
|
|
|
*
|
2015-11-14 11:44:49 +13:00
|
|
|
* ContentNegotiator doesn't enable you to send content as a true XML document through the "text/xml"
|
|
|
|
* or "application/xhtml+xml" Content-Type.
|
|
|
|
*
|
2008-09-16 14:29:00 +00:00
|
|
|
* Please see http://webkit.org/blog/68/understanding-html-xml-and-xhtml/ for further information.
|
2014-08-15 18:53:05 +12:00
|
|
|
*
|
2012-04-12 18:02:46 +12:00
|
|
|
* @package framework
|
2015-11-14 11:44:49 +13:00
|
|
|
*
|
2008-02-25 02:10:37 +00:00
|
|
|
* @subpackage control
|
2014-08-15 18:53:05 +12:00
|
|
|
*
|
2008-09-16 14:29:00 +00:00
|
|
|
* @todo Check for correct XHTML doctype in xhtml()
|
|
|
|
* @todo Allow for other HTML4 doctypes (e.g. Transitional) in html()
|
2015-11-14 11:44:49 +13:00
|
|
|
* @todo Make content replacement and doctype setting two separately configurable behaviours
|
|
|
|
*
|
|
|
|
* Some developers might know what they're doing and don't want ContentNegotiator messing with their
|
|
|
|
* HTML4 doctypes, but still find it useful to have self-closing tags removed.
|
2007-07-19 10:40:28 +00:00
|
|
|
*/
|
2013-03-21 19:48:54 +01:00
|
|
|
class ContentNegotiator extends Object {
|
2009-11-26 22:12:40 +00:00
|
|
|
|
2013-03-21 19:48:54 +01:00
|
|
|
/**
|
|
|
|
* @config
|
2015-11-14 11:44:49 +13:00
|
|
|
*
|
2013-03-21 19:48:54 +01:00
|
|
|
* @var string
|
|
|
|
*/
|
|
|
|
private static $content_type = '';
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2013-03-21 19:48:54 +01:00
|
|
|
/**
|
|
|
|
* @config
|
2015-11-14 11:44:49 +13:00
|
|
|
*
|
2013-03-21 19:48:54 +01:00
|
|
|
* @var string
|
|
|
|
*/
|
|
|
|
private static $encoding = 'utf-8';
|
2009-11-26 22:12:40 +00:00
|
|
|
|
2013-03-21 19:48:54 +01:00
|
|
|
/**
|
|
|
|
* @config
|
2015-11-14 11:44:49 +13:00
|
|
|
*
|
|
|
|
* @var bool
|
2013-03-21 19:48:54 +01:00
|
|
|
*/
|
|
|
|
private static $enabled = false;
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2013-05-13 10:57:23 +02:00
|
|
|
/**
|
|
|
|
* @config
|
2015-11-14 11:44:49 +13:00
|
|
|
*
|
2013-05-13 10:57:23 +02:00
|
|
|
* @var string
|
|
|
|
*/
|
|
|
|
private static $default_format = 'html';
|
2009-11-26 22:12:40 +00:00
|
|
|
|
2007-07-19 10:40:28 +00:00
|
|
|
/**
 * Change the character set used for negotiated responses.
 *
 * Raises a deprecation notice and then writes the given value to the "ContentNegotiator.encoding"
 * config setting. That setting defaults to utf-8; switching it to, say, windows-1252 can improve
 * interoperability with extended characters imported from Windows Excel.
 *
 * @deprecated 4.0 Use the "ContentNegotiator.encoding" config setting instead
 *
 * @param string $encoding Character set name to store in the config setting
 */
public static function set_encoding($encoding) {
	Deprecation::notice(
		'4.0',
		'Use the "ContentNegotiator.encoding" config setting instead'
	);

	$config = Config::inst();
	$config->update('ContentNegotiator', 'encoding', $encoding);
}
|
2009-11-26 22:16:02 +00:00
|
|
|
|
2007-07-19 10:40:28 +00:00
|
|
|
/**
 * Read the character set currently stored in the "ContentNegotiator.encoding" config setting,
 * i.e. the value written by ContentNegotiator::set_encoding() or configured directly.
 *
 * Raises a deprecation notice before reading the setting.
 *
 * @deprecated 4.0 Use the "ContentNegotiator.encoding" config setting instead.
 *
 * @return string
 */
public static function get_encoding() {
	Deprecation::notice(
		'4.0',
		'Use the "ContentNegotiator.encoding" config setting instead'
	);

	$charset = Config::inst()->get('ContentNegotiator', 'encoding');

	return $charset;
}
|
2009-11-26 22:16:02 +00:00
|
|
|
|
|
|
|
/**
 * Turn content negotiation on for all templates, not just those with the xml header, by
 * setting the "ContentNegotiator.enabled" config setting to true.
 *
 * Raises a deprecation notice before updating the setting.
 *
 * @deprecated 4.0 Use the "ContentNegotiator.enabled" config setting instead
 */
public static function enable() {
	Deprecation::notice(
		'4.0',
		'Use the "ContentNegotiator.enabled" config setting instead'
	);

	$config = Config::inst();
	$config->update('ContentNegotiator', 'enabled', true);
}
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2013-03-21 19:48:54 +01:00
|
|
|
/**
 * Set the "ContentNegotiator.enabled" config setting to false.
 *
 * With the setting off, enabled_for() only accepts responses whose body starts with the
 * xml header. Raises a deprecation notice before updating the setting.
 *
 * @deprecated 4.0 Use the "ContentNegotiator.enabled" config setting instead
 */
public static function disable() {
	Deprecation::notice(
		'4.0',
		'Use the "ContentNegotiator.enabled" config setting instead'
	);

	$config = Config::inst();
	$config->update('ContentNegotiator', 'enabled', false);
}
|
2009-11-26 22:16:02 +00:00
|
|
|
|
|
|
|
/**
 * Decide whether content negotiation applies to the given response.
 *
 * A response that already carries a Content-Type header is only eligible when that header
 * starts with "text/html" or "application/xhtml+xml". Eligible responses are negotiated when
 * the "ContentNegotiator.enabled" config setting is truthy; otherwise only when the body
 * begins with the xml header.
 *
 * @param SS_HTTPResponse $response Object providing getHeader() and getBody()
 *
 * @return bool
 */
public static function enabled_for($response) {
	$contentType = $response->getHeader("Content-Type");

	// Disable content negotiation for other content types
	if($contentType) {
		$isHtml = (substr($contentType, 0, 9) == 'text/html');
		$isXhtml = (substr($contentType, 0, 21) == 'application/xhtml+xml');

		if(!$isHtml && !$isXhtml) {
			return false;
		}
	}

	// Globally switched on: every (x)html response qualifies
	if(Config::inst()->get('ContentNegotiator', 'enabled')) {
		return true;
	}

	// Otherwise opt in per template through a leading xml header
	$bodyStart = substr($response->getBody(), 0, 5);

	return ($bodyStart == '<' . '?xml');
}
|
|
|
|
|
2015-11-14 11:44:49 +13:00
|
|
|
/**
 * Choose between the "html" and "xhtml" output formats for a response and rewrite the
 * response through the matching method (html() or xhtml()).
 *
 * Returns without touching the response when enabled_for() rejects it. Otherwise the format
 * is selected in this order:
 * - if PHP has already sent the HTTP headers, the "ContentNegotiator.default_format" setting
 * - a GET variable ?forceFormat, but only when it names a known format ("xhtml" or "html");
 *   any other value is ignored so request input can never select an arbitrary method
 * - "xhtml" if the user agent starts with "W3C_Validator/"
 * - the known format with the highest quality value in the HTTP Accept header; formats
 *   sent with q=0 are treated as not acceptable, ties go to "xhtml"
 * - if none of the above matches, the "ContentNegotiator.default_format" setting
 *
 * @param SS_HTTPResponse $response
 */
public static function process(SS_HTTPResponse $response) {
	if(!self::enabled_for($response)) return;

	$mimes = array(
		"xhtml" => "application/xhtml+xml",
		"html" => "text/html",
	);

	$forcedFormat = isset($_GET['forceFormat']) ? $_GET['forceFormat'] : null;

	if(headers_sent()) {
		$chosenFormat = Config::inst()->get('ContentNegotiator', 'default_format');

	} else if(is_string($forcedFormat) && isset($mimes[$forcedFormat])) {
		// The value ends up as a method name below, so it must be one of the known formats.
		// The is_string() check also rejects array input such as ?forceFormat[]=x.
		$chosenFormat = $forcedFormat;

	} else if(
		isset($_SERVER['HTTP_USER_AGENT'])
		&& substr($_SERVER['HTTP_USER_AGENT'], 0, 14) == 'W3C_Validator/'
	) {
		// The W3C validator doesn't send an HTTP_ACCEPT header, but it can support xhtml. We put this
		// special case in here so that designers don't get worried that their templates are HTML4.
		$chosenFormat = "xhtml";

	} else {
		$chosenFormat = null;
		$bestQuality = 0.0;

		if(isset($_SERVER['HTTP_ACCEPT'])) {
			foreach($mimes as $format => $mime) {
				// Optional weight: whitespace is allowed around ";" and the qvalue may be
				// a bare integer ("q=1", "q=0") as well as a decimal ("q=0.8").
				$regExp = '/' . preg_quote($mime, '/') . '(\s*;\s*q=(\d+(?:\.\d+)?))?/i';
				if(!preg_match($regExp, $_SERVER['HTTP_ACCEPT'], $matches)) continue;

				$quality = isset($matches[2]) ? (float)$matches[2] : 1.0;

				// Strict comparison keeps the first format in $mimes on a tie and never
				// selects a format the client marked as unacceptable (q=0).
				if($quality > $bestQuality) {
					$bestQuality = $quality;
					$chosenFormat = $format;
				}
			}
		}

		if($chosenFormat === null) {
			$chosenFormat = Config::inst()->get('ContentNegotiator', 'default_format');
		}
	}

	$negotiator = new ContentNegotiator();
	$negotiator->$chosenFormat( $response );
}
|
|
|
|
|
2014-08-15 18:53:05 +12:00
|
|
|
/**
 * Rewrite the response so it can be delivered as XHTML.
 *
 * Sends the user defined "ContentNegotiator.content_type" if it is set, otherwise the strict
 * "application/xhtml+xml", together with the configured charset and a "Vary: Accept" header.
 * Then replaces a few common tags and entities in the body with their XHTML representations:
 * - the conditional-comment base tag produced by html() becomes a self-closed <base ... />
 * - &nbsp; becomes the numeric reference &#160;
 * - <br>, <hr>, <img>, <input> and <param> become self-closing
 * - bare "selected" on <option> and bare "checked" on <input> get an explicit value
 *
 * @param SS_HTTPResponse $response
 *
 * @todo Search for more xhtml replacement
 */
public function xhtml(SS_HTTPResponse $response) {
	$content = $response->getBody();
	$encoding = Config::inst()->get('ContentNegotiator', 'encoding');

	$contentType = Config::inst()->get('ContentNegotiator', 'content_type');
	if (empty($contentType)) {
		$contentType = "application/xhtml+xml";
	}
	$response->addHeader("Content-Type", $contentType . "; charset=" . $encoding);
	$response->addHeader("Vary" , "Accept");

	// Fix base tag: undo the HTML4 form '<base href="..."><!--[if lte IE 6]></base><![endif]-->'
	$content = preg_replace(
		'/<base href="([^"]*)"><!--\[if[^\]]*\]><\/base><!\[endif\]-->/',
		'<base href="$1" />',
		$content
	);

	// &nbsp; is not one of XML's predefined entities, so use the numeric character reference
	$content = str_replace('&nbsp;','&#160;', $content);
	$content = str_replace('<br>','<br />', $content);
	$content = str_replace('<hr>','<hr />', $content);

	// Self-close void elements that are not already closed
	foreach(array('img', 'input', 'param') as $tag) {
		$content = preg_replace('#(<' . $tag . '[^>]*[^/>])>#i', '\\1/>', $content);
	}

	// Expand minimised boolean attributes; the lookahead skips attributes that already have a value
	$content = preg_replace('#(\<option[^>]*[\s]+selected)(?!\s*\=)#si', '$1="selected"', $content);
	$content = preg_replace('#(\<input[^>]*[\s]+checked)(?!\s*\=)#si', '$1="checked"', $content);

	$response->setBody($content);
}
|
2014-08-15 18:53:05 +12:00
|
|
|
|
2015-11-14 11:44:49 +13:00
|
|
|
/**
 * Rewrite the response so it can be delivered as HTML.
 *
 * Performs the following steps:
 * - Sends the user defined "ContentNegotiator.content_type" if it is set, otherwise "text/html",
 *   together with the configured charset and a "Vary: Accept" header.
 * - Turns a self-closed <base href="..." /> into the conditional-comment form.
 * - Removes any <?xml> pragma.
 * - Replaces self-closing tags like <img /> with unclosed solitary tags like <img>.
 * - Replaces "xml:lang" with "lang" and all occurrences of "application/xhtml+xml" with "text/html".
 * - If the body started with an XML header, replaces existing doctypes with HTML4.01 Strict.
 * - Removes the "xmlns" attribute from the opening <html> tag.
 *
 * @param SS_HTTPResponse $response
 */
public function html(SS_HTTPResponse $response) {
	$charset = Config::inst()->get('ContentNegotiator', 'encoding');
	$mimeType = Config::inst()->get('ContentNegotiator', 'content_type');

	$headerValue = empty($mimeType)
		? "text/html; charset=" . $charset
		: $mimeType . "; charset=" . $charset;
	$response->addHeader("Content-Type", $headerValue);
	$response->addHeader("Vary", "Accept");

	$body = $response->getBody();

	// Remember this before the pragma is stripped below
	$startedWithXmlHeader = (substr($body, 0, 5) == '<' . '?xml');

	// Fix base tag (must run before the generic "/>" replacement further down)
	$body = preg_replace(
		'/<base href="([^"]*)" \/>/',
		'<base href="$1"><!--[if lte IE 6]></base><![endif]-->',
		$body
	);

	// Drop the <?xml ... ?> pragma and one trailing newline
	$body = preg_replace("#<\\?xml[^>]+\\?>\n?#", '', $body);

	$xhtmlTokens = array('/>', 'xml:lang', 'application/xhtml+xml');
	$htmlTokens = array('>', 'lang', 'text/html');
	$body = str_replace($xhtmlTokens, $htmlTokens, $body);

	// Only replace the doctype in templates with the xml header
	if($startedWithXmlHeader) {
		$html4Doctype = '<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01//EN" "http://www.w3.org/TR/html4/strict.dtd">';
		$body = preg_replace('/<!DOCTYPE[^>]+>/', $html4Doctype, $body);
	}

	$body = preg_replace('/<html xmlns="[^"]+"/', '<html ', $body);

	$response->setBody($body);
}
|
2009-11-27 01:43:14 +00:00
|
|
|
|
|
|
|
}
|