Blame view

vendor/symfony/css-selector/Parser/Tokenizer/TokenizerEscaping.php 1.96 KB
ad2e91f7   Mihail   move multyparser ...
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
  <?php
  
  /*
   * This file is part of the Symfony package.
   *
   * (c) Fabien Potencier <fabien@symfony.com>
   *
   * For the full copyright and license information, please view the LICENSE
   * file that was distributed with this source code.
   */
  
  namespace Symfony\Component\CssSelector\Parser\Tokenizer;
  
  /**
   * CSS selector tokenizer escaping applier.
   *
   * This component is a port of the Python cssselect library,
   * which is copyright Ian Bicking, @see https://github.com/SimonSapin/cssselect.
   *
   * @author Jean-François Simon <jeanfrancois.simon@sensiolabs.com>
   */
  class TokenizerEscaping
  {
      /**
       * Provider of the regular expressions used to locate escape sequences.
       *
       * @var TokenizerPatterns
       */
      private $patterns;

      /**
       * @param TokenizerPatterns $patterns Supplies the unicode, simple and new-line escape patterns
       */
      public function __construct(TokenizerPatterns $patterns)
      {
          $this->patterns = $patterns;
      }

      /**
       * Resolves escape sequences in a value.
       *
       * Unicode escapes are decoded first; afterwards every match of the simple
       * escape pattern is replaced by its first capture group.
       *
       * @param string $value
       *
       * @return string
       */
      public function escapeUnicode($value)
      {
          $value = $this->replaceUnicodeSequences($value);

          return preg_replace($this->patterns->getSimpleEscapePattern(), '$1', $value);
      }

      /**
       * Removes every match of the new-line escape pattern, then resolves the
       * remaining escapes exactly as escapeUnicode() does.
       *
       * @param string $value
       *
       * @return string
       */
      public function escapeUnicodeAndNewLine($value)
      {
          $value = preg_replace($this->patterns->getNewLineEscapePattern(), '', $value);

          return $this->escapeUnicode($value);
      }

      /**
       * Replaces each match of the unicode escape pattern by the UTF-8 encoding
       * of the code point whose hexadecimal digits are in the first capture group.
       *
       * Code points up to 0x10FFFF are encoded using one to four bytes. Values
       * that remain above 0x10FFFF after the modulo below are not valid Unicode
       * code points and are replaced by an empty string.
       *
       * @param string $value
       *
       * @return string
       */
      private function replaceUnicodeSequences($value)
      {
          return preg_replace_callback($this->patterns->getUnicodeEscapePattern(), function ($match) {
              // Wrap into the 21-bit range addressable by a 4-byte UTF-8 sequence.
              $c = hexdec($match[1]) % 0x200000;

              if ($c < 0x80) {
                  // 1 byte: 0xxxxxxx
                  return chr($c);
              }
              if ($c < 0x800) {
                  // 2 bytes: 110xxxxx 10xxxxxx
                  return chr(0xC0 | ($c >> 6)).chr(0x80 | ($c & 0x3F));
              }
              if ($c < 0x10000) {
                  // 3 bytes: 1110xxxx 10xxxxxx 10xxxxxx
                  return chr(0xE0 | ($c >> 12)).chr(0x80 | (($c >> 6) & 0x3F)).chr(0x80 | ($c & 0x3F));
              }
              if ($c < 0x110000) {
                  // 4 bytes: 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
                  // Without this branch supplementary-plane characters were silently dropped.
                  return chr(0xF0 | ($c >> 18))
                      .chr(0x80 | (($c >> 12) & 0x3F))
                      .chr(0x80 | (($c >> 6) & 0x3F))
                      .chr(0x80 | ($c & 0x3F));
              }

              // Beyond the last Unicode code point: there is nothing valid to emit.
              return '';
          }, $value);
      }
  }