[ Index ]

PHP Cross Reference of BackPress




/includes/ -> functions.kses.php (source)

   1  <?php
   2  // Last sync [WP17185]
   4  /**
   5   * kses 0.2.2 - HTML/XHTML filter that only allows some elements and attributes
   6   * Copyright (C) 2002, 2003, 2005  Ulf Harnhammar
   7   *
   8   * This program is free software and open source software; you can redistribute
   9   * it and/or modify it under the terms of the GNU General Public License as
  10   * published by the Free Software Foundation; either version 2 of the License,
  11   * or (at your option) any later version.
  12   *
  13   * This program is distributed in the hope that it will be useful, but WITHOUT
  14   * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  15   * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
  16   * more details.
  17   *
  18   * You should have received a copy of the GNU General Public License along
  19   * with this program; if not, write to the Free Software Foundation, Inc.,
  20   * 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA  or visit
  21   * http://www.gnu.org/licenses/gpl.html
  22   * 
  23   * [kses strips evil scripts!]
  24   *
  25   * Added wp_ prefix to avoid conflicts with existing kses users
  26   *
  27   * @version 0.2.2
  28   * @copyright (C) 2002, 2003, 2005
  29   * @author Ulf Harnhammar <http://advogato.org/person/metaur/>
  30   *
  31   * @package External
  32   * @subpackage KSES
  33   *
  34   */
  36  /**
  37   * You can override this in a plugin.
  38   *
  39   * @since 1.2.0
  40   */
  41  if ( ! defined( 'BP_CUSTOM_TAGS' ) )
  42      define( 'BP_CUSTOM_TAGS', false );
  44  if ( ! BP_CUSTOM_TAGS ) {
  45      /**
  46       * Kses global for default allowable HTML tags.
  47       *
  48       * Can be override by using CUSTOM_TAGS constant.
  49       *
  50       * @global array $allowedposttags
  51       * @since 2.0.0
  52       */
  53      $allowedposttags = array(
  54          'address' => array(),
  55          'a' => array(
  56              'class' => array (),
  57              'href' => array (),
  58              'id' => array (),
  59              'title' => array (),
  60              'rel' => array (),
  61              'rev' => array (),
  62              'name' => array (),
  63              'target' => array()),
  64          'abbr' => array(
  65              'class' => array (),
  66              'title' => array ()),
  67          'acronym' => array(
  68              'title' => array ()),
  69          'article' => array(
  70              'align' => array (),
  71              'class' => array (),
  72              'dir' => array (),
  73              'lang' => array(),
  74              'style' => array (),
  75              'xml:lang' => array(),
  76          ),
  77          'aside' => array(
  78              'align' => array (),
  79              'class' => array (),
  80              'dir' => array (),
  81              'lang' => array(),
  82              'style' => array (),
  83              'xml:lang' => array(),
  84          ),
  85          'b' => array(),
  86          'big' => array(),
  87          'blockquote' => array(
  88              'id' => array (),
  89              'cite' => array (),
  90              'class' => array(),
  91              'lang' => array(),
  92              'xml:lang' => array()),
  93          'br' => array (
  94              'class' => array ()),
  95          'button' => array(
  96              'disabled' => array (),
  97              'name' => array (),
  98              'type' => array (),
  99              'value' => array ()),
 100          'caption' => array(
 101              'align' => array (),
 102              'class' => array ()),
 103          'cite' => array (
 104              'class' => array(),
 105              'dir' => array(),
 106              'lang' => array(),
 107              'title' => array ()),
 108          'code' => array (
 109              'style' => array()),
 110          'col' => array(
 111              'align' => array (),
 112              'char' => array (),
 113              'charoff' => array (),
 114              'span' => array (),
 115              'dir' => array(),
 116              'style' => array (),
 117              'valign' => array (),
 118              'width' => array ()),
 119          'del' => array(
 120              'datetime' => array ()),
 121          'dd' => array(),
 122          'details' => array(
 123              'align' => array (),
 124              'class' => array (),
 125              'dir' => array (),
 126              'lang' => array(),
 127              'open' => array (),
 128              'style' => array (),
 129              'xml:lang' => array(),
 130          ),
 131          'div' => array(
 132              'align' => array (),
 133              'class' => array (),
 134              'dir' => array (),
 135              'lang' => array(),
 136              'style' => array (),
 137              'xml:lang' => array()),
 138          'dl' => array(),
 139          'dt' => array(),
 140          'em' => array(),
 141          'fieldset' => array(),
 142          'figure' => array(
 143              'align' => array (),
 144              'class' => array (),
 145              'dir' => array (),
 146              'lang' => array(),
 147              'style' => array (),
 148              'xml:lang' => array(),
 149          ),
 150          'figcaption' => array(
 151              'align' => array (),
 152              'class' => array (),
 153              'dir' => array (),
 154              'lang' => array(),
 155              'style' => array (),
 156              'xml:lang' => array(),
 157          ),
 158          'font' => array(
 159              'color' => array (),
 160              'face' => array (),
 161              'size' => array ()),
 162          'footer' => array(
 163              'align' => array (),
 164              'class' => array (),
 165              'dir' => array (),
 166              'lang' => array(),
 167              'style' => array (),
 168              'xml:lang' => array(),
 169          ),
 170          'form' => array(
 171              'action' => array (),
 172              'accept' => array (),
 173              'accept-charset' => array (),
 174              'enctype' => array (),
 175              'method' => array (),
 176              'name' => array (),
 177              'target' => array ()),
 178          'h1' => array(
 179              'align' => array (),
 180              'class' => array (),
 181              'id'    => array (),
 182              'style' => array ()),
 183          'h2' => array (
 184              'align' => array (),
 185              'class' => array (),
 186              'id'    => array (),
 187              'style' => array ()),
 188          'h3' => array (
 189              'align' => array (),
 190              'class' => array (),
 191              'id'    => array (),
 192              'style' => array ()),
 193          'h4' => array (
 194              'align' => array (),
 195              'class' => array (),
 196              'id'    => array (),
 197              'style' => array ()),
 198          'h5' => array (
 199              'align' => array (),
 200              'class' => array (),
 201              'id'    => array (),
 202              'style' => array ()),
 203          'h6' => array (
 204              'align' => array (),
 205              'class' => array (),
 206              'id'    => array (),
 207              'style' => array ()),
 208          'header' => array(
 209              'align' => array (),
 210              'class' => array (),
 211              'dir' => array (),
 212              'lang' => array(),
 213              'style' => array (),
 214              'xml:lang' => array(),
 215          ),
 216          'hgroup' => array(
 217              'align' => array (),
 218              'class' => array (),
 219              'dir' => array (),
 220              'lang' => array(),
 221              'style' => array (),
 222              'xml:lang' => array(),
 223          ),
 224          'hr' => array (
 225              'align' => array (),
 226              'class' => array (),
 227              'noshade' => array (),
 228              'size' => array (),
 229              'width' => array ()),
 230          'i' => array(),
 231          'img' => array(
 232              'alt' => array (),
 233              'align' => array (),
 234              'border' => array (),
 235              'class' => array (),
 236              'height' => array (),
 237              'hspace' => array (),
 238              'longdesc' => array (),
 239              'vspace' => array (),
 240              'src' => array (),
 241              'style' => array (),
 242              'width' => array ()),
 243          'ins' => array(
 244              'datetime' => array (),
 245              'cite' => array ()),
 246          'kbd' => array(),
 247          'label' => array(
 248              'for' => array ()),
 249          'legend' => array(
 250              'align' => array ()),
 251          'li' => array (
 252              'align' => array (),
 253              'class' => array ()),
 254          'menu' => array (
 255              'class' => array (),
 256              'style' => array (),
 257              'type' => array ()),
 258          'nav' => array(
 259              'align' => array (),
 260              'class' => array (),
 261              'dir' => array (),
 262              'lang' => array(),
 263              'style' => array (),
 264              'xml:lang' => array(),
 265          ),
 266          'p' => array(
 267              'class' => array (),
 268              'align' => array (),
 269              'dir' => array(),
 270              'lang' => array(),
 271              'style' => array (),
 272              'xml:lang' => array()),
 273          'pre' => array(
 274              'style' => array(),
 275              'width' => array ()),
 276          'q' => array(
 277              'cite' => array ()),
 278          's' => array(),
 279          'span' => array (
 280              'class' => array (),
 281              'dir' => array (),
 282              'align' => array (),
 283              'lang' => array (),
 284              'style' => array (),
 285              'title' => array (),
 286              'xml:lang' => array()),
 287          'section' => array(
 288              'align' => array (),
 289              'class' => array (),
 290              'dir' => array (),
 291              'lang' => array(),
 292              'style' => array (),
 293              'xml:lang' => array(),
 294          ),
 295          'strike' => array(),
 296          'strong' => array(),
 297          'sub' => array(),
 298          'summary' => array(
 299              'align' => array (),
 300              'class' => array (),
 301              'dir' => array (),
 302              'lang' => array(),
 303              'style' => array (),
 304              'xml:lang' => array(),
 305          ),
 306          'sup' => array(),
 307          'table' => array(
 308              'align' => array (),
 309              'bgcolor' => array (),
 310              'border' => array (),
 311              'cellpadding' => array (),
 312              'cellspacing' => array (),
 313              'class' => array (),
 314              'dir' => array(),
 315              'id' => array(),
 316              'rules' => array (),
 317              'style' => array (),
 318              'summary' => array (),
 319              'width' => array ()),
 320          'tbody' => array(
 321              'align' => array (),
 322              'char' => array (),
 323              'charoff' => array (),
 324              'valign' => array ()),
 325          'td' => array(
 326              'abbr' => array (),
 327              'align' => array (),
 328              'axis' => array (),
 329              'bgcolor' => array (),
 330              'char' => array (),
 331              'charoff' => array (),
 332              'class' => array (),
 333              'colspan' => array (),
 334              'dir' => array(),
 335              'headers' => array (),
 336              'height' => array (),
 337              'nowrap' => array (),
 338              'rowspan' => array (),
 339              'scope' => array (),
 340              'style' => array (),
 341              'valign' => array (),
 342              'width' => array ()),
 343          'textarea' => array(
 344              'cols' => array (),
 345              'rows' => array (),
 346              'disabled' => array (),
 347              'name' => array (),
 348              'readonly' => array ()),
 349          'tfoot' => array(
 350              'align' => array (),
 351              'char' => array (),
 352              'class' => array (),
 353              'charoff' => array (),
 354              'valign' => array ()),
 355          'th' => array(
 356              'abbr' => array (),
 357              'align' => array (),
 358              'axis' => array (),
 359              'bgcolor' => array (),
 360              'char' => array (),
 361              'charoff' => array (),
 362              'class' => array (),
 363              'colspan' => array (),
 364              'headers' => array (),
 365              'height' => array (),
 366              'nowrap' => array (),
 367              'rowspan' => array (),
 368              'scope' => array (),
 369              'valign' => array (),
 370              'width' => array ()),
 371          'thead' => array(
 372              'align' => array (),
 373              'char' => array (),
 374              'charoff' => array (),
 375              'class' => array (),
 376              'valign' => array ()),
 377          'title' => array(),
 378          'tr' => array(
 379              'align' => array (),
 380              'bgcolor' => array (),
 381              'char' => array (),
 382              'charoff' => array (),
 383              'class' => array (),
 384              'style' => array (),
 385              'valign' => array ()),
 386          'tt' => array(),
 387          'u' => array(),
 388          'ul' => array (
 389              'class' => array (),
 390              'style' => array (),
 391              'type' => array ()),
 392          'ol' => array (
 393              'class' => array (),
 394              'start' => array (),
 395              'style' => array (),
 396              'type' => array ()),
 397          'var' => array ());
 399      /**
 400       * Kses allowed HTML elements.
 401       *
 402       * @global array $allowedtags
 403       * @since 1.0.0
 404       */
 405      $allowedtags = array(
 406          'a' => array(
 407              'href' => array (),
 408              'title' => array ()),
 409          'abbr' => array(
 410              'title' => array ()),
 411          'acronym' => array(
 412              'title' => array ()),
 413          'b' => array(),
 414          'blockquote' => array(
 415              'cite' => array ()),
 416          //    'br' => array(),
 417          'cite' => array (),
 418          'code' => array(),
 419          'del' => array(
 420              'datetime' => array ()),
 421          //    'dd' => array(),
 422          //    'dl' => array(),
 423          //    'dt' => array(),
 424          'em' => array (), 'i' => array (),
 425          //    'ins' => array('datetime' => array(), 'cite' => array()),
 426          //    'li' => array(),
 427          //    'ol' => array(),
 428          //    'p' => array(),
 429          'q' => array(
 430              'cite' => array ()),
 431          'strike' => array(),
 432          'strong' => array(),
 433          //    'sub' => array(),
 434          //    'sup' => array(),
 435          //    'u' => array(),
 436          //    'ul' => array(),
 437      );
 439      $allowedentitynames = array(
 440          'nbsp',    'iexcl',  'cent',    'pound',  'curren', 'yen',
 441          'brvbar',  'sect',   'uml',     'copy',   'ordf',   'laquo',
 442          'not',     'shy',    'reg',     'macr',   'deg',    'plusmn',
 443          'acute',   'micro',  'para',    'middot', 'cedil',  'ordm',
 444          'raquo',   'iquest', 'Agrave',  'Aacute', 'Acirc',  'Atilde',
 445          'Auml',    'Aring',  'AElig',   'Ccedil', 'Egrave', 'Eacute',
 446          'Ecirc',   'Euml',   'Igrave',  'Iacute', 'Icirc',  'Iuml',
 447          'ETH',     'Ntilde', 'Ograve',  'Oacute', 'Ocirc',  'Otilde',
 448          'Ouml',    'times',  'Oslash',  'Ugrave', 'Uacute', 'Ucirc',
 449          'Uuml',    'Yacute', 'THORN',   'szlig',  'agrave', 'aacute',
 450          'acirc',   'atilde', 'auml',    'aring',  'aelig',  'ccedil',
 451          'egrave',  'eacute', 'ecirc',   'euml',   'igrave', 'iacute',
 452          'icirc',   'iuml',   'eth',     'ntilde', 'ograve', 'oacute',
 453          'ocirc',   'otilde', 'ouml',    'divide', 'oslash', 'ugrave',
 454          'uacute',  'ucirc',  'uuml',    'yacute', 'thorn',  'yuml',
 455          'quot',    'amp',    'lt',      'gt',     'apos',   'OElig',
 456          'oelig',   'Scaron', 'scaron',  'Yuml',   'circ',   'tilde',
 457          'ensp',    'emsp',   'thinsp',  'zwnj',   'zwj',    'lrm',
 458          'rlm',     'ndash',  'mdash',   'lsquo',  'rsquo',  'sbquo',
 459          'ldquo',   'rdquo',  'bdquo',   'dagger', 'Dagger', 'permil',
 460          'lsaquo',  'rsaquo', 'euro',    'fnof',   'Alpha',  'Beta',
 461          'Gamma',   'Delta',  'Epsilon', 'Zeta',   'Eta',    'Theta',
 462          'Iota',    'Kappa',  'Lambda',  'Mu',     'Nu',     'Xi',
 463          'Omicron', 'Pi',     'Rho',     'Sigma',  'Tau',    'Upsilon',
 464          'Phi',     'Chi',    'Psi',     'Omega',  'alpha',  'beta',
 465          'gamma',   'delta',  'epsilon', 'zeta',   'eta',    'theta',
 466          'iota',    'kappa',  'lambda',  'mu',     'nu',     'xi',
 467          'omicron', 'pi',     'rho',     'sigmaf', 'sigma',  'tau',
 468          'upsilon', 'phi',    'chi',     'psi',    'omega',  'thetasym',
 469          'upsih',   'piv',    'bull',    'hellip', 'prime',  'Prime',
 470          'oline',   'frasl',  'weierp',  'image',  'real',   'trade',
 471          'alefsym', 'larr',   'uarr',    'rarr',   'darr',   'harr',
 472          'crarr',   'lArr',   'uArr',    'rArr',   'dArr',   'hArr',
 473          'forall',  'part',   'exist',   'empty',  'nabla',  'isin',
 474          'notin',   'ni',     'prod',    'sum',    'minus',  'lowast',
 475          'radic',   'prop',   'infin',   'ang',    'and',    'or',
 476          'cap',     'cup',    'int',     'sim',    'cong',   'asymp',
 477          'ne',      'equiv',  'le',      'ge',     'sub',    'sup',
 478          'nsub',    'sube',   'supe',    'oplus',  'otimes', 'perp',
 479          'sdot',    'lceil',  'rceil',   'lfloor', 'rfloor', 'lang',
 480          'rang',    'loz',    'spades',  'clubs',  'hearts', 'diams',
 481      );
 482  }
 484  /**
 485   * Filters content and keeps only allowable HTML elements.
 486   *
 487   * This function makes sure that only the allowed HTML element names, attribute
 488   * names and attribute values plus only sane HTML entities will occur in
 489   * $string. You have to remove any slashes from PHP's magic quotes before you
 490   * call this function.
 491   *
 492   * The default allowed protocols are 'http', 'https', 'ftp', 'mailto', 'news',
 493   * 'irc', 'gopher', 'nntp', 'feed', 'telnet, 'mms', 'rtsp' and 'svn'. This
 494   * covers all common link protocols, except for 'javascript' which should not
 495   * be allowed for untrusted users.
 496   *
 497   * @since 1.0.0
 498   *
 499   * @param string $string Content to filter through kses
 500   * @param array $allowed_html List of allowed HTML elements
 501   * @param array $allowed_protocols Optional. Allowed protocol in links.
 502   * @return string Filtered content with only allowed HTML elements
 503   */
 504  function wp_kses($string, $allowed_html, $allowed_protocols = array ()) {
 505      $allowed_protocols = wp_parse_args( $allowed_protocols, apply_filters('kses_allowed_protocols', array ('http', 'https', 'ftp', 'ftps', 'mailto', 'news', 'irc', 'gopher', 'nntp', 'feed', 'telnet', 'mms', 'rtsp', 'svn') ));
 506      $string = wp_kses_no_null($string);
 507      $string = wp_kses_js_entities($string);
 508      $string = wp_kses_normalize_entities($string);
 509      $allowed_html_fixed = wp_kses_array_lc($allowed_html);
 510      $string = wp_kses_hook($string, $allowed_html_fixed, $allowed_protocols); // WP changed the order of these funcs and added args to wp_kses_hook
 511      return wp_kses_split($string, $allowed_html_fixed, $allowed_protocols);
 512  }
 514  /**
 515   * You add any kses hooks here.
 516   *
 517   * There is currently only one kses WordPress hook and it is called here. All
 518   * parameters are passed to the hooks and expected to recieve a string.
 519   *
 520   * @since 1.0.0
 521   *
 522   * @param string $string Content to filter through kses
 523   * @param array $allowed_html List of allowed HTML elements
 524   * @param array $allowed_protocols Allowed protocol in links
 525   * @return string Filtered content through 'pre_kses' hook
 526   */
 527  function wp_kses_hook($string, $allowed_html, $allowed_protocols) {
 528      $string = apply_filters('pre_kses', $string, $allowed_html, $allowed_protocols);
 529      return $string;
 530  }
 532  /**
 533   * This function returns kses' version number.
 534   *
 535   * @since 1.0.0
 536   *
 537   * @return string KSES Version Number
 538   */
 539  function wp_kses_version() {
 540      return '0.2.2';
 541  }
 543  /**
 544   * Searches for HTML tags, no matter how malformed.
 545   *
 546   * It also matches stray ">" characters.
 547   *
 548   * @since 1.0.0
 549   *
 550   * @param string $string Content to filter
 551   * @param array $allowed_html Allowed HTML elements
 552   * @param array $allowed_protocols Allowed protocols to keep
 553   * @return string Content with fixed HTML tags
 554   */
 555  function wp_kses_split($string, $allowed_html, $allowed_protocols) {
 556      global $pass_allowed_html, $pass_allowed_protocols;
 557      $pass_allowed_html = $allowed_html;
 558      $pass_allowed_protocols = $allowed_protocols;
 559      return preg_replace_callback( '%((<!--.*?(-->|$))|(<[^>]*(>|$)|>))%', '_wp_kses_split_callback', $string );
 560  }
 562  /**
 563   * Callback for wp_kses_split.
 564   *
 565   * @since 3.1.0
 566   * @access private
 567   */
 568  function _wp_kses_split_callback( $match ) {
 569      global $pass_allowed_html, $pass_allowed_protocols;
 570      return wp_kses_split2( $match[1], $pass_allowed_html, $pass_allowed_protocols );
 571  }
 573  /**
 574   * Callback for wp_kses_split for fixing malformed HTML tags.
 575   *
 576   * This function does a lot of work. It rejects some very malformed things like
 577   * <:::>. It returns an empty string, if the element isn't allowed (look ma, no
 578   * strip_tags()!). Otherwise it splits the tag into an element and an attribute
 579   * list.
 580   *
 581   * After the tag is split into an element and an attribute list, it is run
 582   * through another filter which will remove illegal attributes and once that is
 583   * completed, will be returned.
 584   *
 585   * @access private
 586   * @since 1.0.0
 587   * @uses wp_kses_attr()
 588   *
 589   * @param string $string Content to filter
 590   * @param array $allowed_html Allowed HTML elements
 591   * @param array $allowed_protocols Allowed protocols to keep
 592   * @return string Fixed HTML element
 593   */
 594  function wp_kses_split2($string, $allowed_html, $allowed_protocols) {
 595      $string = wp_kses_stripslashes($string);
 597      if (substr($string, 0, 1) != '<')
 598          return '&gt;';
 599      # It matched a ">" character
 601      if (preg_match('%^<!--(.*?)(-->)?$%', $string, $matches)) {
 602          $string = str_replace(array('<!--', '-->'), '', $matches[1]);
 603          while ( $string != $newstring = wp_kses($string, $allowed_html, $allowed_protocols) )
 604              $string = $newstring;
 605          if ( $string == '' )
 606              return '';
 607          // prevent multiple dashes in comments
 608          $string = preg_replace('/--+/', '-', $string);
 609          // prevent three dashes closing a comment
 610          $string = preg_replace('/-$/', '', $string);
 611          return "<!--{$string}-->";
 612      }
 613      # Allow HTML comments
 615      if (!preg_match('%^<\s*(/\s*)?([a-zA-Z0-9]+)([^>]*)>?$%', $string, $matches))
 616          return '';
 617      # It's seriously malformed
 619      $slash = trim($matches[1]);
 620      $elem = $matches[2];
 621      $attrlist = $matches[3];
 623      if (!@isset($allowed_html[strtolower($elem)]))
 624          return '';
 625      # They are using a not allowed HTML element
 627      if ($slash != '')
 628          return "<$slash$elem>";
 629      # No attributes are allowed for closing elements
 631      return wp_kses_attr("$slash$elem", $attrlist, $allowed_html, $allowed_protocols);
 632  }
 634  /**
 635   * Removes all attributes, if none are allowed for this element.
 636   *
 637   * If some are allowed it calls wp_kses_hair() to split them further, and then
 638   * it builds up new HTML code from the data that kses_hair() returns. It also
 639   * removes "<" and ">" characters, if there are any left. One more thing it does
 640   * is to check if the tag has a closing XHTML slash, and if it does, it puts one
 641   * in the returned code as well.
 642   *
 643   * @since 1.0.0
 644   *
 645   * @param string $element HTML element/tag
 646   * @param string $attr HTML attributes from HTML element to closing HTML element tag
 647   * @param array $allowed_html Allowed HTML elements
 648   * @param array $allowed_protocols Allowed protocols to keep
 649   * @return string Sanitized HTML element
 650   */
 651  function wp_kses_attr($element, $attr, $allowed_html, $allowed_protocols) {
 652      # Is there a closing XHTML slash at the end of the attributes?
 654      $xhtml_slash = '';
 655      if (preg_match('%\s*/\s*$%', $attr))
 656          $xhtml_slash = ' /';
 658      # Are any attributes allowed at all for this element?
 660      if (@ count($allowed_html[strtolower($element)]) == 0)
 661          return "<$element$xhtml_slash>";
 663      # Split it
 665      $attrarr = wp_kses_hair($attr, $allowed_protocols);
 667      # Go through $attrarr, and save the allowed attributes for this element
 668      # in $attr2
 670      $attr2 = '';
 672      foreach ($attrarr as $arreach) {
 673          if (!@ isset ($allowed_html[strtolower($element)][strtolower($arreach['name'])]))
 674              continue; # the attribute is not allowed
 676          $current = $allowed_html[strtolower($element)][strtolower($arreach['name'])];
 677          if ($current == '')
 678              continue; # the attribute is not allowed
 680          if (!is_array($current))
 681              $attr2 .= ' '.$arreach['whole'];
 682          # there are no checks
 684          else {
 685              # there are some checks
 686              $ok = true;
 687              foreach ($current as $currkey => $currval)
 688                  if (!wp_kses_check_attr_val($arreach['value'], $arreach['vless'], $currkey, $currval)) {
 689                      $ok = false;
 690                      break;
 691                  }
 693              if ( strtolower($arreach['name']) == 'style' ) {
 694                  $orig_value = $arreach['value'];
 696                  $value = safecss_filter_attr($orig_value);
 698                  if ( empty($value) )
 699                      continue;
 701                  $arreach['value'] = $value;
 703                  $arreach['whole'] = str_replace($orig_value, $value, $arreach['whole']);
 704              }
 706              if ($ok)
 707                  $attr2 .= ' '.$arreach['whole']; # it passed them
 708          } # if !is_array($current)
 709      } # foreach
 711      # Remove any "<" or ">" characters
 713      $attr2 = preg_replace('/[<>]/', '', $attr2);
 715      return "<$element$attr2$xhtml_slash>";
 716  }
 718  /**
 719   * Builds an attribute list from string containing attributes.
 720   *
 721   * This function does a lot of work. It parses an attribute list into an array
 722   * with attribute data, and tries to do the right thing even if it gets weird
 723   * input. It will add quotes around attribute values that don't have any quotes
 724   * or apostrophes around them, to make it easier to produce HTML code that will
 725   * conform to W3C's HTML specification. It will also remove bad URL protocols
 726   * from attribute values.  It also reduces duplicate attributes by using the
 727   * attribute defined first (foo='bar' foo='baz' will result in foo='bar').
 728   *
 729   * @since 1.0.0
 730   *
 731   * @param string $attr Attribute list from HTML element to closing HTML element tag
 732   * @param array $allowed_protocols Allowed protocols to keep
 733   * @return array List of attributes after parsing
 734   */
 735  function wp_kses_hair($attr, $allowed_protocols) {
 736      $attrarr = array ();
 737      $mode = 0;
 738      $attrname = '';
 739      $uris = array('xmlns', 'profile', 'href', 'src', 'cite', 'classid', 'codebase', 'data', 'usemap', 'longdesc', 'action');
 741      # Loop through the whole attribute list
 743      while (strlen($attr) != 0) {
 744          $working = 0; # Was the last operation successful?
 746          switch ($mode) {
 747              case 0 : # attribute name, href for instance
 749                  if (preg_match('/^([-a-zA-Z]+)/', $attr, $match)) {
 750                      $attrname = $match[1];
 751                      $working = $mode = 1;
 752                      $attr = preg_replace('/^[-a-zA-Z]+/', '', $attr);
 753                  }
 755                  break;
 757              case 1 : # equals sign or valueless ("selected")
 759                  if (preg_match('/^\s*=\s*/', $attr)) # equals sign
 760                      {
 761                      $working = 1;
 762                      $mode = 2;
 763                      $attr = preg_replace('/^\s*=\s*/', '', $attr);
 764                      break;
 765                  }
 767                  if (preg_match('/^\s+/', $attr)) # valueless
 768                      {
 769                      $working = 1;
 770                      $mode = 0;
 771                      if(FALSE === array_key_exists($attrname, $attrarr)) {
 772                          $attrarr[$attrname] = array ('name' => $attrname, 'value' => '', 'whole' => $attrname, 'vless' => 'y');
 773                      }
 774                      $attr = preg_replace('/^\s+/', '', $attr);
 775                  }
 777                  break;
 779              case 2 : # attribute value, a URL after href= for instance
 781                  if (preg_match('%^"([^"]*)"(\s+|/?$)%', $attr, $match))
 782                      # "value"
 783                      {
 784                      $thisval = $match[1];
 785                      if ( in_array(strtolower($attrname), $uris) )
 786                          $thisval = wp_kses_bad_protocol($thisval, $allowed_protocols);
 788                      if(FALSE === array_key_exists($attrname, $attrarr)) {
 789                          $attrarr[$attrname] = array ('name' => $attrname, 'value' => $thisval, 'whole' => "$attrname=\"$thisval\"", 'vless' => 'n');
 790                      }
 791                      $working = 1;
 792                      $mode = 0;
 793                      $attr = preg_replace('/^"[^"]*"(\s+|$)/', '', $attr);
 794                      break;
 795                  }
 797                  if (preg_match("%^'([^']*)'(\s+|/?$)%", $attr, $match))
 798                      # 'value'
 799                      {
 800                      $thisval = $match[1];
 801                      if ( in_array(strtolower($attrname), $uris) )
 802                          $thisval = wp_kses_bad_protocol($thisval, $allowed_protocols);
 804                      if(FALSE === array_key_exists($attrname, $attrarr)) {
 805                          $attrarr[$attrname] = array ('name' => $attrname, 'value' => $thisval, 'whole' => "$attrname='$thisval'", 'vless' => 'n');
 806                      }
 807                      $working = 1;
 808                      $mode = 0;
 809                      $attr = preg_replace("/^'[^']*'(\s+|$)/", '', $attr);
 810                      break;
 811                  }
 813                  if (preg_match("%^([^\s\"']+)(\s+|/?$)%", $attr, $match))
 814                      # value
 815                      {
 816                      $thisval = $match[1];
 817                      if ( in_array(strtolower($attrname), $uris) )
 818                          $thisval = wp_kses_bad_protocol($thisval, $allowed_protocols);
 820                      if(FALSE === array_key_exists($attrname, $attrarr)) {
 821                          $attrarr[$attrname] = array ('name' => $attrname, 'value' => $thisval, 'whole' => "$attrname=\"$thisval\"", 'vless' => 'n');
 822                      }
 823                      # We add quotes to conform to W3C's HTML spec.
 824                      $working = 1;
 825                      $mode = 0;
 826                      $attr = preg_replace("%^[^\s\"']+(\s+|$)%", '', $attr);
 827                  }
 829                  break;
 830          } # switch
 832          if ($working == 0) # not well formed, remove and try again
 833          {
 834              $attr = wp_kses_html_error($attr);
 835              $mode = 0;
 836          }
 837      } # while
 839      if ($mode == 1 && FALSE === array_key_exists($attrname, $attrarr))
 840          # special case, for when the attribute list ends with a valueless
 841          # attribute like "selected"
 842          $attrarr[$attrname] = array ('name' => $attrname, 'value' => '', 'whole' => $attrname, 'vless' => 'y');
 844      return $attrarr;
 845  }
 847  /**
 848   * Performs different checks for attribute values.
 849   *
 850   * The currently implemented checks are "maxlen", "minlen", "maxval", "minval"
 851   * and "valueless" with even more checks to come soon.
 852   *
 853   * @since 1.0.0
 854   *
 855   * @param string $value Attribute value
 856   * @param string $vless Whether the value is valueless. Use 'y' or 'n'
 857   * @param string $checkname What $checkvalue is checking for.
 858   * @param mixed $checkvalue What constraint the value should pass
 859   * @return bool Whether check passes
 860   */
 861  function wp_kses_check_attr_val($value, $vless, $checkname, $checkvalue) {
 862      $ok = true;
 864      switch (strtolower($checkname)) {
 865          case 'maxlen' :
 866              # The maxlen check makes sure that the attribute value has a length not
 867              # greater than the given value. This can be used to avoid Buffer Overflows
 868              # in WWW clients and various Internet servers.
 870              if (strlen($value) > $checkvalue)
 871                  $ok = false;
 872              break;
 874          case 'minlen' :
 875              # The minlen check makes sure that the attribute value has a length not
 876              # smaller than the given value.
 878              if (strlen($value) < $checkvalue)
 879                  $ok = false;
 880              break;
 882          case 'maxval' :
 883              # The maxval check does two things: it checks that the attribute value is
 884              # an integer from 0 and up, without an excessive amount of zeroes or
 885              # whitespace (to avoid Buffer Overflows). It also checks that the attribute
 886              # value is not greater than the given value.
 887              # This check can be used to avoid Denial of Service attacks.
 889              if (!preg_match('/^\s{0,6}[0-9]{1,6}\s{0,6}$/', $value))
 890                  $ok = false;
 891              if ($value > $checkvalue)
 892                  $ok = false;
 893              break;
 895          case 'minval' :
 896              # The minval check checks that the attribute value is a positive integer,
 897              # and that it is not smaller than the given value.
 899              if (!preg_match('/^\s{0,6}[0-9]{1,6}\s{0,6}$/', $value))
 900                  $ok = false;
 901              if ($value < $checkvalue)
 902                  $ok = false;
 903              break;
 905          case 'valueless' :
 906              # The valueless check checks if the attribute has a value
 907              # (like <a href="blah">) or not (<option selected>). If the given value
 908              # is a "y" or a "Y", the attribute must not have a value.
 909              # If the given value is an "n" or an "N", the attribute must have one.
 911              if (strtolower($checkvalue) != $vless)
 912                  $ok = false;
 913              break;
 914      } # switch
 916      return $ok;
 917  }
 919  /**
 920   * Sanitize string from bad protocols.
 921   *
 922   * This function removes all non-allowed protocols from the beginning of
 923   * $string. It ignores whitespace and the case of the letters, and it does
 924   * understand HTML entities. It does its work in a while loop, so it won't be
 925   * fooled by a string like "javascript:javascript:alert(57)".
 926   *
 927   * @since 1.0.0
 928   *
 929   * @param string $string Content to filter bad protocols from
 930   * @param array $allowed_protocols Allowed protocols to keep
 931   * @return string Filtered content
 932   */
 933  function wp_kses_bad_protocol($string, $allowed_protocols) {
 934      $string = wp_kses_no_null($string);
 935      $string2 = $string.'a';
 937      while ($string != $string2) {
 938          $string2 = $string;
 939          $string = wp_kses_bad_protocol_once($string, $allowed_protocols);
 940      } # while
 942      return $string;
 943  }
 945  /**
 946   * Removes any NULL characters in $string.
 947   *
 948   * @since 1.0.0
 949   *
 950   * @param string $string
 951   * @return string
 952   */
 953  function wp_kses_no_null($string) {
 954      $string = preg_replace('/\0+/', '', $string);
 955      $string = preg_replace('/(\\\\0)+/', '', $string);
 957      return $string;
 958  }
 960  /**
 961   * Strips slashes from in front of quotes.
 962   *
 963   * This function changes the character sequence  \"  to just  ". It leaves all
 964   * other slashes alone. It's really weird, but the quoting from
 965   * preg_replace(//e) seems to require this.
 966   *
 967   * @since 1.0.0
 968   *
 969   * @param string $string String to strip slashes
 970   * @return string Fixed strings with quoted slashes
 971   */
 972  function wp_kses_stripslashes($string) {
 973      return preg_replace('%\\\\"%', '"', $string);
 974  }
 976  /**
 977   * Goes through an array and changes the keys to all lower case.
 978   *
 979   * @since 1.0.0
 980   *
 981   * @param array $inarray Unfiltered array
 982   * @return array Fixed array with all lowercase keys
 983   */
 984  function wp_kses_array_lc($inarray) {
 985      $outarray = array ();
 987      foreach ( (array) $inarray as $inkey => $inval) {
 988          $outkey = strtolower($inkey);
 989          $outarray[$outkey] = array ();
 991          foreach ( (array) $inval as $inkey2 => $inval2) {
 992              $outkey2 = strtolower($inkey2);
 993              $outarray[$outkey][$outkey2] = $inval2;
 994          } # foreach $inval
 995      } # foreach $inarray
 997      return $outarray;
 998  }
/**
 * Strips the HTML JavaScript entities found in early versions of Netscape 4.
 *
 * Removes everything from an ampersand followed by an opening brace up to the
 * closing brace (and an optional semicolon), or up to the end of the string
 * when the brace is never closed.
 *
 * @since 1.0.0
 *
 * @param string $string
 * @return string
 */
function wp_kses_js_entities($string) {
    $js_entity = '%&\s*\{[^}]*(\}\s*;?|$)%';

    return preg_replace($js_entity, '', $string);
}
/**
 * Recovers from a parsing error in wp_kses_hair().
 *
 * Drops the leading run of non-whitespace from the string, together with the
 * whitespace that follows it. Quoted and apostrophed segments are consumed
 * as a unit (an unterminated one runs to the end of the string), so
 * whitespace inside them does not stop the removal.
 *
 * @since 1.0.0
 *
 * @param string $string
 * @return string
 */
function wp_kses_html_error($string) {
    $broken_prefix = '/^("[^"]*("|$)|\'[^\']*(\'|$)|\S)*\s*/';

    return preg_replace($broken_prefix, '', $string);
}
/**
 * Performs one pass of protocol sanitizing on a string.
 *
 * The string is split at the first colon, written either literally or as the
 * numeric entity &#58; / &#x3a;. When there is such a colon and the text before
 * it does not contain the sequence "/?", that text is passed to
 * wp_kses_bad_protocol_once2() and the result is joined with the trimmed
 * remainder. Otherwise the string is returned untouched.
 *
 * @since 1.0.0
 *
 * @param string $string Content to check for bad protocols
 * @param string $allowed_protocols Allowed protocols
 * @return string Sanitized content
 */
function wp_kses_bad_protocol_once($string, $allowed_protocols) {
    $pieces = preg_split( '/:|&#0*58;|&#x0*3a;/i', $string, 2 );

    // No colon at all: nothing that could be a protocol.
    if ( ! isset($pieces[1]) )
        return $string;

    if ( preg_match('%/\?%', $pieces[0]) )
        return $string;

    $scheme = wp_kses_bad_protocol_once2( $pieces[0], $allowed_protocols );

    return $scheme . trim( $pieces[1] );
}
/**
 * Checks a protocol candidate for wp_kses_bad_protocol_once().
 *
 * The candidate is normalized (numeric entities decoded, whitespace and NULL
 * characters removed, lower-cased) and compared with each allowed protocol in
 * lower case.
 *
 * @access private
 * @since 1.0.0
 *
 * @param string $string URI scheme to check against the whitelist
 * @param string $allowed_protocols Allowed protocols
 * @return string The normalized scheme followed by a colon when it is allowed,
 *                an empty string otherwise
 */
function wp_kses_bad_protocol_once2( $string, $allowed_protocols ) {
    $scheme = wp_kses_decode_entities($string);
    $scheme = preg_replace('/\s/', '', $scheme);
    $scheme = strtolower( wp_kses_no_null($scheme) );

    foreach ( (array) $allowed_protocols as $candidate ) {
        if ( strtolower($candidate) == $scheme )
            return "$scheme:";
    }

    // Not on the whitelist: drop the protocol entirely.
    return '';
}
/**
 * Normalizes the HTML entities in a string.
 *
 * Every ampersand is first turned into "&amp;". Named, decimal and hexadecimal
 * entities are then handed, in that order, to their callbacks, which decide
 * whether to restore them. This converts "AT&T" to "AT&amp;T", "&#00058;" to
 * "&#58;", "&#XYZZY;" to "&amp;#XYZZY;" and so on.
 *
 * @since 1.0.0
 *
 * @param string $string Content to normalize entities
 * @return string Content with normalized entities
 */
function wp_kses_normalize_entities($string) {
    # Disarm all entities by converting & to &amp;
    $string = str_replace('&', '&amp;', $string);

    # Restore the entities accepted by each callback, one entity form at a time
    $restorers = array(
        '/&amp;([A-Za-z]{2,8});/' => 'wp_kses_named_entities',
        '/&amp;#(0*[0-9]{1,7});/' => 'wp_kses_normalize_entities2',
        '/&amp;#[Xx](0*[0-9A-Fa-f]{1,6});/' => 'wp_kses_normalize_entities3',
    );

    foreach ( $restorers as $pattern => $callback )
        $string = preg_replace_callback($pattern, $callback, $string);

    return $string;
}
/**
 * Callback for wp_kses_normalize_entities() regular expression.
 *
 * Restores a named entity only when its name is listed in the global
 * $allowedentitynames. Any other name keeps its ampersand escaped.
 *
 * @since 3.0.0
 *
 * @param array $matches preg_replace_callback() matches array
 * @return string Correctly encoded entity
 */
function wp_kses_named_entities($matches) {
    global $allowedentitynames;

    if ( empty($matches[1]) )
        return '';

    $name = $matches[1];

    if ( in_array($name, $allowedentitynames) )
        return "&$name;";

    return "&amp;$name;";
}
/**
 * Callback for wp_kses_normalize_entities() regular expression.
 *
 * Handles decimal entities (&#number;). A number accepted by valid_unicode()
 * is restored with its leading zeros removed and then left-padded with zeros
 * to at least three digits. Any other number keeps its ampersand escaped.
 *
 * @access private
 * @since 1.0.0
 *
 * @param array $matches preg_replace_callback() matches array
 * @return string Correctly encoded entity
 */
function wp_kses_normalize_entities2($matches) {
    if ( empty($matches[1]) )
        return '';

    $digits = $matches[1];

    if ( ! valid_unicode($digits) )
        return "&amp;#$digits;";

    $canonical = str_pad(ltrim($digits, '0'), 3, '0', STR_PAD_LEFT);

    return "&#$canonical;";
}
/**
 * Callback for wp_kses_normalize_entities() for regular expression.
 *
 * Handles hexadecimal entities (&#xhex;). A value accepted by valid_unicode()
 * is restored with its leading zeros removed. Any other value keeps its
 * ampersand escaped.
 *
 * @access private
 *
 * @param array $matches preg_replace_callback() matches array
 * @return string Correctly encoded entity
 */
function wp_kses_normalize_entities3($matches) {
    if ( empty($matches[1]) )
        return '';

    $hexchars = $matches[1];

    if ( valid_unicode(hexdec($hexchars)) )
        return '&#x'.ltrim($hexchars,'0').';';

    return "&amp;#x$hexchars;";
}
/**
 * Helper function to determine if a Unicode value is valid.
 *
 * Accepted values are tab (0x9), line feed (0xa), carriage return (0xd) and
 * the ranges 0x20-0xd7ff, 0xe000-0xfffd and 0x10000-0x10ffff.
 *
 * @param int $i Unicode value
 * @return bool true if the value was a valid Unicode number
 */
function valid_unicode($i) {
    // The three permitted control characters.
    if ( $i == 0x9 || $i == 0xa || $i == 0xd )
        return true;

    if ( $i >= 0x20 && $i <= 0xd7ff )
        return true;

    if ( $i >= 0xe000 && $i <= 0xfffd )
        return true;

    return ( $i >= 0x10000 && $i <= 0x10ffff );
}
/**
 * Convert all entities to their character counterparts.
 *
 * Only numeric entities are decoded: decimal ones (&#65;) first, then
 * hexadecimal ones (&#x41;). Named entities like &auml; are left alone, which
 * is fine for the URL protocol whitelisting system.
 *
 * @since 1.0.0
 *
 * @param string $string Content to change entities
 * @return string Content after decoded entities
 */
function wp_kses_decode_entities($string) {
    $decoders = array(
        '/&#([0-9]+);/' => '_wp_kses_decode_entities_chr',
        '/&#[Xx]([0-9A-Fa-f]+);/' => '_wp_kses_decode_entities_chr_hexdec',
    );

    foreach ( $decoders as $pattern => $callback )
        $string = preg_replace_callback($pattern, $callback, $string);

    return $string;
}
/**
 * Regex callback for wp_kses_decode_entities()
 *
 * Turns the digits of a decimal entity into the single byte chr() yields for
 * that number, i.e. the number modulo 256.
 *
 * The digit string is unbounded and comes from the filtered markup. Passing
 * it to chr() directly fails for numbers beyond the integer range, because
 * such a string cannot be coerced to an integer.
 *
 * @param array $match preg match
 * @return string
 */
function _wp_kses_decode_entities_chr( $match ) {
    // 10^8 is a multiple of 256, so the last eight digits decide the value
    // modulo 256, and they always fit in an integer.
    $low_digits = substr( $match[1], -8 );

    return chr( (int) $low_digits );
}
/**
 * Regex callback for wp_kses_decode_entities()
 *
 * Turns the digits of a hexadecimal entity into the single byte chr() yields
 * for that number, i.e. the number modulo 256.
 *
 * The digit string is unbounded and comes from the filtered markup. For long
 * inputs hexdec() returns a float, and chr() cannot accept a float that lies
 * beyond the integer range.
 *
 * @param array $match preg match
 * @return string
 */
function _wp_kses_decode_entities_chr_hexdec( $match ) {
    // Two hex digits are exactly one byte, so the last two digits decide the
    // value modulo 256 and hexdec() never leaves the integer range.
    $low_digits = substr( $match[1], -2 );

    return chr( hexdec( $low_digits ) );
}
/**
 * Sanitize slashed content with the default allowed HTML Kses rules.
 *
 * The slashes are removed, the content is filtered with wp_kses() against
 * the global $allowedtags, and the result is slashed again.
 *
 * @since 1.0.0
 * @uses $allowedtags
 *
 * @param string $data Content to filter, expected to be escaped with slashes
 * @return string Filtered content
 */
function wp_filter_kses($data) {
    global $allowedtags;

    $unslashed = stripslashes( $data );
    $filtered = wp_kses( $unslashed, $allowedtags );

    return addslashes( $filtered );
}
/**
 * Sanitize unslashed content with the default allowed HTML Kses rules.
 *
 * Filters the content with wp_kses() against the global $allowedtags.
 *
 * @since 2.9.0
 * @uses $allowedtags
 *
 * @param string $data Content to filter, expected to not be escaped
 * @return string Filtered content
 */
function wp_kses_data($data) {
    global $allowedtags;

    $filtered = wp_kses( $data, $allowedtags );

    return $filtered;
}
/**
 * Sanitize slashed post content for allowed HTML tags.
 *
 * Post content refers to the page contents of the 'post' type and not $_POST
 * data from forms. The slashes are removed, the content is filtered with
 * wp_kses() against the global $allowedposttags, and the result is slashed
 * again.
 *
 * @since 2.0.0
 * @uses $allowedposttags
 *
 * @param string $data Post content to filter, expected to be escaped with slashes
 * @return string Filtered post content with allowed HTML tags and attributes intact.
 */
function wp_filter_post_kses($data) {
    global $allowedposttags;

    $unslashed = stripslashes( $data );
    $filtered = wp_kses( $unslashed, $allowedposttags );

    return addslashes( $filtered );
}
/**
 * Sanitize unslashed post content for allowed HTML tags.
 *
 * Post content refers to the page contents of the 'post' type and not $_POST
 * data from forms. Filters the content with wp_kses() against the global
 * $allowedposttags.
 *
 * @since 2.9.0
 * @uses $allowedposttags
 *
 * @param string $data Post content to filter
 * @return string Filtered post content with allowed HTML tags and attributes intact.
 */
function wp_kses_post($data) {
    global $allowedposttags;

    $filtered = wp_kses( $data, $allowedposttags );

    return $filtered;
}
/**
 * Strips all of the HTML in slashed content.
 *
 * The slashes are removed, the content is filtered with wp_kses() against an
 * empty list of allowed tags, and the result is slashed again.
 *
 * @since 2.1.0
 *
 * @param string $data Content to strip all HTML from
 * @return string Filtered content without any HTML
 */
function wp_filter_nohtml_kses($data) {
    $no_tags_allowed = array();

    $unslashed = stripslashes( $data );
    $filtered = wp_kses( $unslashed, $no_tags_allowed );

    return addslashes( $filtered );
}
1298  // ! function kses_init_filters()
1299  // ! function kses_remove_filters()
1300  // ! function kses_init()
/**
 * Inline CSS filter
 *
 * Filters the value of a style attribute. NULL characters, newlines, carriage
 * returns and tabs are removed first. The whole value is then rejected (an
 * empty string is returned) when it contains a backslash, an opening
 * parenthesis, an ampersand, a closing brace, an equals sign or a comment
 * opener. Otherwise the value is split on semicolons and only declarations
 * whose property name is in the 'safe_style_css' filtered whitelist are kept.
 * Items without a colon are kept as they are.
 *
 * @since 2.8.1
 *
 * @param string $css Value of a style attribute
 * @param mixed $deprecated Never implemented; a non-empty value only triggers
 *                          _deprecated_argument()
 * @return string Filtered declarations joined with semicolons, or an empty
 *                string when the value is rejected
 */
function safecss_filter_attr( $css, $deprecated = '' ) {
    if ( !empty( $deprecated ) )
        _deprecated_argument( __FUNCTION__, '2.8.1' ); // Never implemented

    $css = wp_kses_no_null($css);
    $css = str_replace(array("\n","\r","\t"), '', $css);

    // Remove any inline css containing \ ( & } = or comments.
    // Four backslashes are needed in the PHP literal: the single-quoted string
    // reduces them to two, which the regex engine reads as one literal
    // backslash inside the character class. With only two, the class merely
    // held an escaped "(" and CSS backslash escapes slipped through.
    if ( preg_match( '%[\\\\(&=}]|/\*%', $css ) )
        return '';

    $css_array = explode( ';', trim( $css ) );
    $allowed_attr = apply_filters( 'safe_style_css', array( 'text-align', 'margin', 'color', 'float',
    'border', 'background', 'background-color', 'border-bottom', 'border-bottom-color',
    'border-bottom-style', 'border-bottom-width', 'border-collapse', 'border-color', 'border-left',
    'border-left-color', 'border-left-style', 'border-left-width', 'border-right', 'border-right-color',
    'border-right-style', 'border-right-width', 'border-spacing', 'border-style', 'border-top',
    'border-top-color', 'border-top-style', 'border-top-width', 'border-width', 'caption-side',
    'clear', 'cursor', 'direction', 'font', 'font-family', 'font-size', 'font-style',
    'font-variant', 'font-weight', 'height', 'letter-spacing', 'line-height', 'margin-bottom',
    'margin-left', 'margin-right', 'margin-top', 'overflow', 'padding', 'padding-bottom',
    'padding-left', 'padding-right', 'padding-top', 'text-decoration', 'text-indent', 'vertical-align',
    'width' ) );

    // An empty whitelist turns the per-property filtering off.
    if ( empty($allowed_attr) )
        return $css;

    $css = '';
    foreach ( $css_array as $css_item ) {
        if ( $css_item == '' )
            continue;
        $css_item = trim( $css_item );
        $found = false;
        if ( strpos( $css_item, ':' ) === false ) {
            // No property/value separator: kept as is.
            $found = true;
        } else {
            // Only the text before the first colon is the property name.
            $parts = explode( ':', $css_item );
            if ( in_array( trim( $parts[0] ), $allowed_attr ) )
                $found = true;
        }
        if ( $found ) {
            if( $css != '' )
                $css .= ';';
            $css .= $css_item;
        }
    }

    return $css;
}

Generated: Wed Mar 12 01:00:59 2025 Cross-referenced by PHPXref 0.7.1