123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495 |
- <?php
- /**
- * Basic support for outputting syndication feeds in RSS, other formats.
- *
- * Contains the base feed item class as well as the classes that build RSS and Atom feeds.
- * Available feeds are defined in Defines.php
- *
- * Copyright © 2004 Brion Vibber <brion@pobox.com>
- * https://www.mediawiki.org/
- *
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License along
- * with this program; if not, write to the Free Software Foundation, Inc.,
- * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
- * http://www.gnu.org/copyleft/gpl.html
- *
- * @file
- */
- /**
- * @defgroup Feed Feed
- */
- /**
- * A base class for basic support for outputting syndication feeds in RSS and other formats.
- *
- * @ingroup Feed
- */
class FeedItem {
	/** @var string|Title Item title; converted to a string when encoded */
	public $title;

	/** @var string Item description, stored unescaped */
	public $description;

	/** @var string Item URL, stored unescaped */
	public $url;

	/** @var string Item date, stored exactly as passed to the constructor */
	public $date;

	/** @var string Author name, stored unescaped */
	public $author;

	/** @var string Unique id of the item; initialised to the item URL */
	public $uniqueId;

	/** @var string Comments value, stored unescaped */
	public $comments;

	/** @var bool Whether the unique id is a permalink (RSS feeds only) */
	public $rssIsPermalink = false;

	/**
	 * Store the raw (unescaped) values of the item. The unique id starts out
	 * equal to the URL; use setUniqueId() to override it.
	 *
	 * @param string|Title $title Item's title
	 * @param string $description
	 * @param string $url URL uniquely designating the item.
	 * @param string $date Item's date
	 * @param string $author Author's user name
	 * @param string $comments
	 */
	public function __construct( $title, $description, $url, $date = '', $author = '', $comments = '' ) {
		$this->title = $title;
		$this->description = $description;
		$this->url = $url;
		$this->uniqueId = $url;
		$this->date = $date;
		$this->author = $author;
		$this->comments = $comments;
	}

	/**
	 * Encode $string so that it can be safely embedded in a XML document
	 *
	 * CRLF pairs are normalised to LF, control characters that XML 1.0 does
	 * not permit are removed, and &, <, > and double quotes are replaced by
	 * entities. Single quotes are left untouched.
	 *
	 * @param string|null $string String to encode; null (and anything else
	 *   convertible to string) is accepted and converted first
	 * @return string
	 */
	public function xmlEncode( $string ) {
		// Callers in this file pass the result of formatTime(), which is null
		// for items without a date, and the title may be an object. Convert up
		// front so the string functions below always receive a real string
		// (passing null to them is deprecated as of PHP 8.1).
		$string = (string)$string;
		$string = str_replace( "\r\n", "\n", $string );
		// Remove C0 control characters, keeping tab, LF and CR
		$string = preg_replace( '/[\x00-\x08\x0b\x0c\x0e-\x1f]/', '', $string );
		// Spell out the flags: the default changed in PHP 8.1, which would make
		// the feed output depend on the PHP version in use.
		return htmlspecialchars( $string, ENT_COMPAT );
	}

	/**
	 * Get the unique id of this item; already xml-encoded
	 *
	 * @return string|null Null when the item has no unique id
	 */
	public function getUniqueID() {
		$id = $this->getUniqueIdUnescaped();
		if ( !$id ) {
			return null;
		}
		return $this->xmlEncode( $id );
	}

	/**
	 * Get the unique id of this item, without any escaping
	 *
	 * The stored id is passed through wfExpandUrl() with PROTO_CURRENT.
	 *
	 * @return string|null Null when the item has no unique id
	 */
	public function getUniqueIdUnescaped() {
		if ( !$this->uniqueId ) {
			return null;
		}
		return wfExpandUrl( $this->uniqueId, PROTO_CURRENT );
	}

	/**
	 * Set the unique id of an item
	 *
	 * @param string $uniqueId Unique id for the item
	 * @param bool $rssIsPermalink Set to true if the guid (unique id) is a permalink (RSS feeds only)
	 */
	public function setUniqueId( $uniqueId, $rssIsPermalink = false ) {
		$this->uniqueId = $uniqueId;
		$this->rssIsPermalink = $rssIsPermalink;
	}

	/**
	 * Get the title of this item; already xml-encoded
	 *
	 * @return string
	 */
	public function getTitle() {
		return $this->xmlEncode( $this->title );
	}

	/**
	 * Get the URL of this item; already xml-encoded
	 *
	 * @return string
	 */
	public function getUrl() {
		return $this->xmlEncode( $this->url );
	}

	/**
	 * Get the URL of this item without any escaping
	 *
	 * @return string
	 */
	public function getUrlUnescaped() {
		return $this->url;
	}

	/**
	 * Get the description of this item; already xml-encoded
	 *
	 * @return string
	 */
	public function getDescription() {
		return $this->xmlEncode( $this->description );
	}

	/**
	 * Get the description of this item without any escaping
	 *
	 * @return string
	 */
	public function getDescriptionUnescaped() {
		return $this->description;
	}

	/**
	 * Get the language of this item
	 *
	 * This is $wgLanguageCode passed through LanguageCode::bcp47(); it is
	 * the same for every item.
	 *
	 * @return string
	 */
	public function getLanguage() {
		global $wgLanguageCode;
		return LanguageCode::bcp47( $wgLanguageCode );
	}

	/**
	 * Get the date of this item, exactly as it was passed to the constructor
	 *
	 * @return string
	 */
	public function getDate() {
		return $this->date;
	}

	/**
	 * Get the author of this item; already xml-encoded
	 *
	 * @return string
	 */
	public function getAuthor() {
		return $this->xmlEncode( $this->author );
	}

	/**
	 * Get the author of this item without any escaping
	 *
	 * @return string
	 */
	public function getAuthorUnescaped() {
		return $this->author;
	}

	/**
	 * Get the comment of this item; already xml-encoded
	 *
	 * @return string
	 */
	public function getComments() {
		return $this->xmlEncode( $this->comments );
	}

	/**
	 * Get the comment of this item without any escaping
	 *
	 * @return string
	 */
	public function getCommentsUnescaped() {
		return $this->comments;
	}

	/**
	 * Quickie hack... strip out wikilinks to more legible form from the comment.
	 *
	 * "[[target|label]]" becomes "label" and "[[target]]" becomes "target".
	 *
	 * @param string $text Wikitext
	 * @return string
	 */
	public static function stripComment( $text ) {
		return preg_replace( '/\[\[([^]]*\|)?([^]]+)\]\]/', '\2', $text );
	}
}
- /**
- * Class to support the outputting of syndication feeds in Atom and RSS format.
- *
- * @ingroup Feed
- */
abstract class ChannelFeed extends FeedItem {
	/** @var TemplateParser Renders the feed templates used by the subclasses */
	protected $templateParser;

	/**
	 * Store the feed's own title, description, URL etc. through the FeedItem
	 * constructor and create the template parser.
	 *
	 * @param string|Title $title Feed's title
	 * @param string $description
	 * @param string $url URL uniquely designating the feed.
	 * @param string $date Feed's date
	 * @param string $author Author's user name
	 * @param string $comments
	 */
	public function __construct( $title, $description, $url, $date = '', $author = '', $comments = '' ) {
		parent::__construct( $title, $description, $url, $date, $author, $comments );
		$this->templateParser = new TemplateParser();
	}

	/**
	 * Generate Header of the feed
	 * @par Example:
	 * @code
	 * print "<feed>";
	 * @endcode
	 */
	abstract public function outHeader();

	/**
	 * Generate an item
	 * @par Example:
	 * @code
	 * print "<item>...</item>";
	 * @endcode
	 * @param FeedItem $item
	 */
	abstract public function outItem( $item );

	/**
	 * Generate Footer of the feed
	 * @par Example:
	 * @code
	 * print "</feed>";
	 * @endcode
	 */
	abstract public function outFooter();

	/**
	 * Setup and send HTTP headers. Don't send any content;
	 * content might end up being cached and re-sent with
	 * these same headers later.
	 *
	 * This should be called from the outHeader() method,
	 * but can also be called separately.
	 */
	public function httpHeaders() {
		global $wgOut, $wgVaryOnXFP;

		# We take over from $wgOut, excepting its cache header info
		$wgOut->disable();
		$mimetype = $this->contentType();
		header( "Content-type: $mimetype; charset=UTF-8" );

		// Set a sane filename
		$exts = MediaWiki\MediaWikiServices::getInstance()->getMimeAnalyzer()
			->getExtensionsForType( $mimetype );
		// $exts is treated as a space-separated list; take its first entry.
		// explode() is used instead of strtok() because strtok() overwrites
		// the process-wide tokenizer state of whoever called us.
		$ext = $exts ? explode( ' ', ltrim( $exts, ' ' ), 2 )[0] : 'xml';
		header( "Content-Disposition: inline; filename=\"feed.{$ext}\"" );

		if ( $wgVaryOnXFP ) {
			$wgOut->addVaryHeader( 'X-Forwarded-Proto' );
		}
		$wgOut->sendCacheControl();
	}

	/**
	 * Return an internet media type to be sent in the headers.
	 *
	 * The type is taken from the 'ctype' request parameter, but only if it
	 * is one of the whitelisted XML types; anything else yields
	 * 'application/xml'.
	 *
	 * @return string
	 */
	private function contentType() {
		global $wgRequest;

		$ctype = $wgRequest->getVal( 'ctype', 'application/xml' );
		$allowedctypes = [
			'application/xml',
			'text/xml',
			'application/rss+xml',
			'application/atom+xml'
		];

		// Strict comparison: the value ends up in a response header, so only
		// an exact string match against the whitelist is accepted.
		return in_array( $ctype, $allowedctypes, true ) ? $ctype : 'application/xml';
	}

	/**
	 * Output the initial XML headers.
	 *
	 * Sends the HTTP headers first, then prints the XML declaration.
	 */
	protected function outXmlHeader() {
		$this->httpHeaders();
		echo '<?xml version="1.0"?>' . "\n";
	}
}
- /**
- * Generate a RSS feed
- *
- * @ingroup Feed
- */
class RSSFeed extends ChannelFeed {
	/**
	 * Format a date given a timestamp. If a timestamp is not given, null is returned
	 *
	 * The result is in GMT, e.g. "Mon, 01 Jan 2018 00:00:00 GMT".
	 *
	 * @param string|int|null $ts Timestamp, in any format wfTimestamp() accepts
	 * @return string|null Date string
	 */
	public function formatTime( $ts ) {
		if ( !$ts ) {
			return null;
		}
		return gmdate( 'D, d M Y H:i:s \G\M\T', wfTimestamp( TS_UNIX, $ts ) );
	}

	/**
	 * Output an RSS 2.0 header
	 *
	 * Sends the HTTP headers and XML declaration, then prints the rendered
	 * 'RSSHeader' template.
	 */
	public function outHeader() {
		global $wgVersion;

		$this->outXmlHeader();
		// Manually escaping rather than letting Mustache do it because Mustache
		// uses htmlentities, which does not work with XML
		$templateParams = [
			'title' => $this->getTitle(),
			'url' => $this->xmlEncode( wfExpandUrl( $this->getUrlUnescaped(), PROTO_CURRENT ) ),
			'description' => $this->getDescription(),
			'language' => $this->xmlEncode( $this->getLanguage() ),
			'version' => $this->xmlEncode( $wgVersion ),
			'timestamp' => $this->xmlEncode( (string)$this->formatTime( wfTimestampNow() ) )
		];
		print $this->templateParser->processTemplate( 'RSSHeader', $templateParams );
	}

	/**
	 * Output an RSS 2.0 item
	 *
	 * Prints the rendered 'RSSItem' template. The "comments" parameter is
	 * only passed to the template when the item has a comments value.
	 *
	 * @param FeedItem $item Item to be output
	 */
	public function outItem( $item ) {
		// Manually escaping rather than letting Mustache do it because Mustache
		// uses htmlentities, which does not work with XML
		$templateParams = [
			"title" => $item->getTitle(),
			"url" => $this->xmlEncode( wfExpandUrl( $item->getUrlUnescaped(), PROTO_CURRENT ) ),
			"permalink" => $item->rssIsPermalink,
			"uniqueID" => $item->getUniqueID(),
			"description" => $item->getDescription(),
			// formatTime() yields null for an item without a date; hand the
			// encoder an empty string rather than null in that case.
			"date" => $this->xmlEncode( (string)$this->formatTime( $item->getDate() ) ),
			"author" => $item->getAuthor()
		];

		$comments = $item->getCommentsUnescaped();
		if ( $comments ) {
			// The comments value is expanded like a URL before being escaped
			$commentsEscaped = $this->xmlEncode( wfExpandUrl( $comments, PROTO_CURRENT ) );
			$templateParams["comments"] = $commentsEscaped;
		}

		print $this->templateParser->processTemplate( 'RSSItem', $templateParams );
	}

	/**
	 * Output an RSS 2.0 footer
	 */
	public function outFooter() {
		print "</channel></rss>";
	}
}
- /**
- * Generate an Atom feed
- *
- * @ingroup Feed
- */
class AtomFeed extends ChannelFeed {
	/**
	 * Format a date given timestamp, if one is given.
	 *
	 * The result is a GMT date and time such as "2018-01-01T00:00:00".
	 * No timezone designator is included here.
	 * NOTE(review): presumably the Atom templates append the "Z" suffix
	 * themselves - confirm before changing this format.
	 *
	 * @param string|int|null $timestamp Timestamp, in any format wfTimestamp() accepts
	 * @return string|null Null when no timestamp is given
	 */
	public function formatTime( $timestamp ) {
		if ( !$timestamp ) {
			return null;
		}
		return gmdate( 'Y-m-d\TH:i:s', wfTimestamp( TS_UNIX, $timestamp ) );
	}

	/**
	 * Outputs a basic header for Atom 1.0 feeds.
	 *
	 * Sends the HTTP headers and XML declaration, then prints the rendered
	 * 'AtomHeader' template.
	 */
	public function outHeader() {
		global $wgVersion;

		$this->outXmlHeader();
		// Manually escaping rather than letting Mustache do it because Mustache
		// uses htmlentities, which does not work with XML
		$templateParams = [
			'language' => $this->xmlEncode( $this->getLanguage() ),
			'feedID' => $this->getFeedId(),
			'title' => $this->getTitle(),
			'url' => $this->xmlEncode( wfExpandUrl( $this->getUrlUnescaped(), PROTO_CURRENT ) ),
			'selfUrl' => $this->getSelfUrl(),
			'timestamp' => $this->xmlEncode( (string)$this->formatTime( wfTimestampNow() ) ),
			'description' => $this->getDescription(),
			'version' => $this->xmlEncode( $wgVersion ),
		];
		print $this->templateParser->processTemplate( 'AtomHeader', $templateParams );
	}

	/**
	 * Atom 1.0 requires a unique, opaque IRI as a unique identifier
	 * for every feed we create. For now just use the URL, but who
	 * can tell if that's right? If we put options on the feed, do we
	 * have to change the id? Maybe? Maybe not.
	 *
	 * @return string Already xml-encoded
	 */
	private function getFeedId() {
		return $this->getSelfUrl();
	}

	/**
	 * Atom 1.0 requests a self-reference to the feed.
	 *
	 * @return string Full URL of the current request; already xml-encoded
	 */
	private function getSelfUrl() {
		global $wgRequest;

		// Use the shared encoder so this value is escaped the same way as
		// every other template parameter.
		return $this->xmlEncode( $wgRequest->getFullRequestURL() );
	}

	/**
	 * Output a given item.
	 *
	 * Prints the rendered 'AtomItem' template.
	 *
	 * @param FeedItem $item
	 */
	public function outItem( $item ) {
		global $wgMimeType;

		// Manually escaping rather than letting Mustache do it because Mustache
		// uses htmlentities, which does not work with XML
		$templateParams = [
			"uniqueID" => $item->getUniqueID(),
			"title" => $item->getTitle(),
			"mimeType" => $this->xmlEncode( $wgMimeType ),
			"url" => $this->xmlEncode( wfExpandUrl( $item->getUrlUnescaped(), PROTO_CURRENT ) ),
			// formatTime() yields null for an item without a date; hand the
			// encoder an empty string rather than null in that case.
			"date" => $this->xmlEncode( (string)$this->formatTime( $item->getDate() ) ),
			"description" => $item->getDescription(),
			"author" => $item->getAuthor()
		];
		print $this->templateParser->processTemplate( 'AtomItem', $templateParams );
	}

	/**
	 * Outputs the footer for Atom 1.0 feed (basically '\</feed\>').
	 */
	public function outFooter() {
		print "</feed>";
	}
}
|