<?php
/**
 * Holder for stripped items when parsing wiki markup.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 * http://www.gnu.org/copyleft/gpl.html
 *
 * @file
 * @ingroup Parser
 */

/**
 * Holder for content that was stripped out of a text and replaced by strip
 * markers.
 *
 * Every item is stored under the key found between Parser::MARKER_PREFIX and
 * Parser::MARKER_SUFFIX in its marker, in one of two buckets: 'nowiki' or
 * 'general'. The unstrip*() methods substitute the stored values back into a
 * text in place of their markers.
 *
 * @ingroup Parser
 */
class StripState {
	/** @var mixed Not assigned anywhere in this class; kept for subclasses */
	protected $prefix;

	/** @var array[] Stored items, as [ 'nowiki' => [ key => value ], 'general' => [ key => value ] ] */
	protected $data;

	/** @var string PCRE pattern matching one strip marker; capture group 1 is the key */
	protected $regex;

	/** @var string|null Bucket being unstripped; read by unstripCallback() */
	protected $tempType;

	/** @var string|null Key prefix in use while merge() runs; read by mergeCallback() */
	protected $tempMergePrefix;

	/** @var bool[] Keys currently being expanded, used to detect self-referencing items */
	protected $circularRefGuard;

	/** @var int Current nesting depth of unstripCallback() */
	protected $recursionLevel = 0;

	/** Maximum nesting depth allowed when expanding markers inside stored values */
	const UNSTRIP_RECURSION_LIMIT = 20;

	/**
	 * @param string|null $prefix
	 * @since 1.26 The prefix argument should be omitted, as the strip marker
	 *  prefix string is now a constant.
	 */
	public function __construct( $prefix = null ) {
		if ( $prefix !== null ) {
			wfDeprecated( __METHOD__ . ' called with $prefix argument' .
				' (call with no arguments instead)', '1.26' );
		}
		$this->data = [
			'nowiki' => [],
			'general' => []
		];
		$this->regex = '/' . Parser::MARKER_PREFIX . "([^\x7f<>&'\"]+)" . Parser::MARKER_SUFFIX . '/';
		$this->circularRefGuard = [];
	}

	/**
	 * Add a nowiki strip item
	 *
	 * @param string $marker Complete strip marker, including prefix and suffix
	 * @param string $value Content the marker stands for
	 * @throws MWException If $marker is not a valid strip marker
	 */
	public function addNoWiki( $marker, $value ) {
		$this->addItem( 'nowiki', $marker, $value );
	}

	/**
	 * Add a general strip item
	 *
	 * @param string $marker Complete strip marker, including prefix and suffix
	 * @param string $value Content the marker stands for
	 * @throws MWException If $marker is not a valid strip marker
	 */
	public function addGeneral( $marker, $value ) {
		$this->addItem( 'general', $marker, $value );
	}

	/**
	 * Store a value in the given bucket under the key extracted from $marker.
	 *
	 * @throws MWException If $marker does not match the strip marker pattern
	 * @param string $type Bucket name, 'nowiki' or 'general'
	 * @param string $marker Complete strip marker, including prefix and suffix
	 * @param string|Closure $value Content the marker stands for; a Closure is
	 *  invoked each time the marker is unstripped and its result is used
	 */
	protected function addItem( $type, $marker, $value ) {
		if ( !preg_match( $this->regex, $marker, $m ) ) {
			throw new MWException( "Invalid marker: $marker" );
		}

		$this->data[$type][$m[1]] = $value;
	}

	/**
	 * Replace the markers of general items in $text with their stored values.
	 *
	 * @param string $text
	 * @return string
	 */
	public function unstripGeneral( $text ) {
		return $this->unstripType( 'general', $text );
	}

	/**
	 * Replace the markers of nowiki items in $text with their stored values.
	 *
	 * @param string $text
	 * @return string
	 */
	public function unstripNoWiki( $text ) {
		return $this->unstripType( 'nowiki', $text );
	}

	/**
	 * Replace the markers of general items, then those of nowiki items.
	 *
	 * @param string $text
	 * @return string
	 */
	public function unstripBoth( $text ) {
		$text = $this->unstripType( 'general', $text );
		$text = $this->unstripType( 'nowiki', $text );
		return $text;
	}

	/**
	 * Replace the markers of one bucket in $text with their stored values.
	 * Markers found inside a substituted value are expanded too, see
	 * unstripCallback().
	 *
	 * @param string $type Bucket name, 'nowiki' or 'general'
	 * @param string $text
	 * @return string
	 */
	protected function unstripType( $type, $text ) {
		// Shortcut
		if ( !count( $this->data[$type] ) ) {
			return $text;
		}

		// The callback receives only the regex match, so the bucket is handed
		// over through a property. This method is re-entered from the callback,
		// hence the save/restore; "finally" keeps the restore from being
		// skipped when a deferred value throws.
		$oldType = $this->tempType;
		$this->tempType = $type;
		try {
			return preg_replace_callback( $this->regex, [ $this, 'unstripCallback' ], $text );
		} finally {
			$this->tempType = $oldType;
		}
	}

	/**
	 * preg_replace_callback() handler for unstripType().
	 *
	 * @param array $m Regex match: $m[0] is the whole marker, $m[1] its key
	 * @return string Replacement text. The marker itself when its key is not in
	 *  the current bucket, an error <span> when the key is already being
	 *  expanded or the recursion limit is reached, otherwise the stored value
	 *  with its own markers of the current bucket expanded.
	 */
	protected function unstripCallback( $m ) {
		$marker = $m[1];
		if ( !isset( $this->data[$this->tempType][$marker] ) ) {
			// Not ours (other bucket or unknown key): leave the marker in place
			return $m[0];
		}

		if ( isset( $this->circularRefGuard[$marker] ) ) {
			return '<span class="error">'
				. wfMessage( 'parser-unstrip-loop-warning' )->inContentLanguage()->text()
				. '</span>';
		}
		if ( $this->recursionLevel >= self::UNSTRIP_RECURSION_LIMIT ) {
			return '<span class="error">' .
				wfMessage( 'parser-unstrip-recursion-limit' )
					->numParams( self::UNSTRIP_RECURSION_LIMIT )->inContentLanguage()->text() .
				'</span>';
		}

		$this->circularRefGuard[$marker] = true;
		$this->recursionLevel++;
		try {
			$value = $this->data[$this->tempType][$marker];
			if ( $value instanceof Closure ) {
				$value = $value();
			}
			return $this->unstripType( $this->tempType, $value );
		} finally {
			// Always undo the bookkeeping. If an exception from a deferred
			// value left the guard set, the next unstrip of this marker would
			// be reported as a loop.
			$this->recursionLevel--;
			unset( $this->circularRefGuard[$marker] );
		}
	}

	/**
	 * Get a StripState object which is sufficient to unstrip the given text.
	 * It will contain the minimum subset of strip items necessary: only the
	 * items whose markers appear in $text itself are copied.
	 *
	 * @param string $text
	 *
	 * @return StripState
	 */
	public function getSubState( $text ) {
		$subState = new StripState();

		// Collect every well-formed marker in a single pass. Anything that
		// merely resembles a marker (a lone prefix or suffix, or a key with
		// forbidden characters) does not match the pattern and is skipped.
		if ( !preg_match_all( $this->regex, $text, $matches ) ) {
			return $subState;
		}

		foreach ( $matches[1] as $key ) {
			if ( isset( $this->data['nowiki'][$key] ) ) {
				$subState->data['nowiki'][$key] = $this->data['nowiki'][$key];
			} elseif ( isset( $this->data['general'][$key] ) ) {
				$subState->data['general'][$key] = $this->data['general'][$key];
			}
		}

		return $subState;
	}

	/**
	 * Merge another StripState object into this one. The strip marker keys
	 * will not be preserved. The strings in the $texts array will have their
	 * strip markers rewritten, the resulting array of strings will be returned.
	 *
	 * Every key taken from $otherState is stored here as "<mergePrefix>-<key>",
	 * where the merge prefix comes from wfRandomString( 16 ), and the markers in
	 * $texts are rewritten to use the same prefixed keys.
	 *
	 * @param StripState $otherState
	 * @param array $texts
	 * @return array
	 */
	public function merge( $otherState, $texts ) {
		$mergePrefix = wfRandomString( 16 );

		foreach ( $otherState->data as $type => $items ) {
			foreach ( $items as $key => $value ) {
				$this->data[$type]["$mergePrefix-$key"] = $value;
			}
		}

		// mergeCallback() receives only the regex match, so the prefix is
		// handed over through a property for the duration of the call.
		$this->tempMergePrefix = $mergePrefix;
		$texts = preg_replace_callback( $otherState->regex, [ $this, 'mergeCallback' ], $texts );
		$this->tempMergePrefix = null;
		return $texts;
	}

	/**
	 * preg_replace_callback() handler for merge(): rebuilds a marker with the
	 * current merge prefix prepended to its key.
	 *
	 * @param array $m Regex match: $m[1] is the original key
	 * @return string
	 */
	protected function mergeCallback( $m ) {
		$key = $m[1];
		return Parser::MARKER_PREFIX . $this->tempMergePrefix . '-' . $key . Parser::MARKER_SUFFIX;
	}

	/**
	 * Remove any strip markers found in the given text.
	 *
	 * @param string $text Input string
	 * @return string
	 */
	public function killMarkers( $text ) {
		return preg_replace( $this->regex, '', $text );
	}
}
|