Search moodle.org's
Developer Documentation

See Release Notes

  • Bug fixes for general core bugs in 4.3.x will end 7 October 2024 (12 months).
  • Bug fixes for security issues in 4.3.x will end 21 April 2025 (18 months).
  • PHP version: minimum PHP 8.0.0. Note: the minimum PHP version has increased since Moodle 4.1. PHP 8.2.x is also supported.
   1  <?php
   2  
   3  /**
   4   * Base class for all validating attribute definitions.
   5   *
   6   * This family of classes forms the core for not only HTML attribute validation,
   7   * but also any sort of string that needs to be validated or cleaned (which
   8   * means CSS properties and composite definitions are defined here too).
   9   * Besides defining (through code) what precisely makes the string valid,
  10   * subclasses are also responsible for cleaning the code if possible.
  11   */
  12  
  13  abstract class HTMLPurifier_AttrDef
  14  {
  15  
  16      /**
  17       * Tells us whether or not an HTML attribute is minimized.
  18       * Has no meaning in other contexts.
  19       * @type bool
  20       */
  21      public $minimized = false;
  22  
  23      /**
  24       * Tells us whether or not an HTML attribute is required.
  25       * Has no meaning in other contexts
  26       * @type bool
  27       */
  28      public $required = false;
  29  
  30      /**
  31       * Validates and cleans passed string according to a definition.
  32       *
  33       * @param string $string String to be validated and cleaned.
  34       * @param HTMLPurifier_Config $config Mandatory HTMLPurifier_Config object.
  35       * @param HTMLPurifier_Context $context Mandatory HTMLPurifier_Context object.
  36       */
  37      abstract public function validate($string, $config, $context);
  38  
  39      /**
  40       * Convenience method that parses a string as if it were CDATA.
  41       *
  42       * This method process a string in the manner specified at
  43       * <http://www.w3.org/TR/html4/types.html#h-6.2> by removing
  44       * leading and trailing whitespace, ignoring line feeds, and replacing
  45       * carriage returns and tabs with spaces.  While most useful for HTML
  46       * attributes specified as CDATA, it can also be applied to most CSS
  47       * values.
  48       *
  49       * @note This method is not entirely standards compliant, as trim() removes
  50       *       more types of whitespace than specified in the spec. In practice,
  51       *       this is rarely a problem, as those extra characters usually have
  52       *       already been removed by HTMLPurifier_Encoder.
  53       *
  54       * @warning This processing is inconsistent with XML's whitespace handling
  55       *          as specified by section 3.3.3 and referenced XHTML 1.0 section
  56       *          4.7.  However, note that we are NOT necessarily
  57       *          parsing XML, thus, this behavior may still be correct. We
  58       *          assume that newlines have been normalized.
  59       */
  60      public function parseCDATA($string)
  61      {
  62          $string = trim($string);
  63          $string = str_replace(array("\n", "\t", "\r"), ' ', $string);
  64          return $string;
  65      }
  66  
  67      /**
  68       * Factory method for creating this class from a string.
  69       * @param string $string String construction info
  70       * @return HTMLPurifier_AttrDef Created AttrDef object corresponding to $string
  71       */
  72      public function make($string)
  73      {
  74          // default implementation, return a flyweight of this object.
  75          // If $string has an effect on the returned object (i.e. you
  76          // need to overload this method), it is best
  77          // to clone or instantiate new copies. (Instantiation is safer.)
  78          return $this;
  79      }
  80  
  81      /**
  82       * Removes spaces from rgb(0, 0, 0) so that shorthand CSS properties work
  83       * properly. THIS IS A HACK!
  84       * @param string $string a CSS colour definition
  85       * @return string
  86       */
  87      protected function mungeRgb($string)
  88      {
  89          $p = '\s*(\d+(\.\d+)?([%]?))\s*';
  90  
  91          if (preg_match('/(rgba|hsla)\(/', $string)) {
  92              return preg_replace('/(rgba|hsla)\('.$p.','.$p.','.$p.','.$p.'\)/', '\1(\2,\5,\8,\11)', $string);
  93          }
  94  
  95          return preg_replace('/(rgb|hsl)\('.$p.','.$p.','.$p.'\)/', '\1(\2,\5,\8)', $string);
  96      }
  97  
  98      /**
  99       * Parses a possibly escaped CSS string and returns the "pure"
 100       * version of it.
 101       */
 102      protected function expandCSSEscape($string)
 103      {
 104          // flexibly parse it
 105          $ret = '';
 106          for ($i = 0, $c = strlen($string); $i < $c; $i++) {
 107              if ($string[$i] === '\\') {
 108                  $i++;
 109                  if ($i >= $c) {
 110                      $ret .= '\\';
 111                      break;
 112                  }
 113                  if (ctype_xdigit($string[$i])) {
 114                      $code = $string[$i];
 115                      for ($a = 1, $i++; $i < $c && $a < 6; $i++, $a++) {
 116                          if (!ctype_xdigit($string[$i])) {
 117                              break;
 118                          }
 119                          $code .= $string[$i];
 120                      }
 121                      // We have to be extremely careful when adding
 122                      // new characters, to make sure we're not breaking
 123                      // the encoding.
 124                      $char = HTMLPurifier_Encoder::unichr(hexdec($code));
 125                      if (HTMLPurifier_Encoder::cleanUTF8($char) === '') {
 126                          continue;
 127                      }
 128                      $ret .= $char;
 129                      if ($i < $c && trim($string[$i]) !== '') {
 130                          $i--;
 131                      }
 132                      continue;
 133                  }
 134                  if ($string[$i] === "\n") {
 135                      continue;
 136                  }
 137              }
 138              $ret .= $string[$i];
 139          }
 140          return $ret;
 141      }
 142  }
 143  
 144  // vim: et sw=4 sts=4