Blame view

vendor/ezyang/htmlpurifier/tests/HTMLPurifier/EntityParserTest.php 3.48 KB
70f4f18b   Administrator   first_commit
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
  <?php
  
  class HTMLPurifier_EntityParserTest extends HTMLPurifier_Harness
  {
  
      protected $EntityParser;
  
      public function setUp()
      {
          $this->EntityParser = new HTMLPurifier_EntityParser();
          $this->_entity_lookup = HTMLPurifier_EntityLookup::instance();
      }
  
      public function test_substituteNonSpecialEntities()
      {
          $char_theta = $this->_entity_lookup->table['theta'];
          $this->assertIdentical($char_theta,
              $this->EntityParser->substituteNonSpecialEntities('&theta;') );
          $this->assertIdentical('"',
              $this->EntityParser->substituteNonSpecialEntities('"') );
  
          // numeric tests, adapted from Feyd
          $args = array();
          $args[] = array(1114112,false     );
          $args[] = array(1114111,'F48FBFBF'); // 0x0010FFFF
          $args[] = array(1048576,'F4808080'); // 0x00100000
          $args[] = array(1048575,'F3BFBFBF'); // 0x000FFFFF
          $args[] = array(262144, 'F1808080'); // 0x00040000
          $args[] = array(262143, 'F0BFBFBF'); // 0x0003FFFF
          $args[] = array(65536,  'F0908080'); // 0x00010000
          $args[] = array(65535,  'EFBFBF'  ); // 0x0000FFFF
          $args[] = array(57344,  'EE8080'  ); // 0x0000E000
          $args[] = array(57343,  false     ); // 0x0000DFFF  these are ill-formed
          $args[] = array(56040,  false     ); // 0x0000DAE8  these are ill-formed
          $args[] = array(55296,  false     ); // 0x0000D800  these are ill-formed
          $args[] = array(55295,  'ED9FBF'  ); // 0x0000D7FF
          $args[] = array(53248,  'ED8080'  ); // 0x0000D000
          $args[] = array(53247,  'ECBFBF'  ); // 0x0000CFFF
          $args[] = array(4096,   'E18080'  ); // 0x00001000
          $args[] = array(4095,   'E0BFBF'  ); // 0x00000FFF
          $args[] = array(2048,   'E0A080'  ); // 0x00000800
          $args[] = array(2047,   'DFBF'    ); // 0x000007FF
          $args[] = array(128,    'C280'    ); // 0x00000080  invalid SGML char
          $args[] = array(127,    '7F'      ); // 0x0000007F  invalid SGML char
          $args[] = array(0,      '00'      ); // 0x00000000  invalid SGML char
  
          $args[] = array(20108,  'E4BA8C'  ); // 0x00004E8C
          $args[] = array(77,     '4D'      ); // 0x0000004D
          $args[] = array(66306,  'F0908C82'); // 0x00010302
          $args[] = array(1072,   'D0B0'    ); // 0x00000430
  
          foreach ($args as $arg) {
              $string = '&#' . $arg[0] . ';' . // decimal
                        '&#x' . dechex($arg[0]) . ';'; // hex
              $expect = '';
              if ($arg[1] !== false) {
                  // this is only for PHP 5, the below is PHP 5 and PHP 4
                  //$chars = str_split($arg[1], 2);
                  $chars = array();
                  // strlen must be called in loop because strings size changes
                  for ($i = 0; strlen($arg[1]) > $i; $i += 2) {
                      $chars[] = $arg[1][$i] . $arg[1][$i+1];
                  }
                  foreach ($chars as $char) {
                      $expect .= chr(hexdec($char));
                  }
                  $expect .= $expect; // double it
              }
              $this->assertIdentical(
                  $this->EntityParser->substituteNonSpecialEntities($string),
                  $expect,
                  'Identical expectation [Hex: '. dechex($arg[0]) .']'
              );
          }
  
      }
  
      public function test_substituteSpecialEntities()
      {
          $this->assertIdentical(
              "'",
              $this->EntityParser->substituteSpecialEntities('&#39;')
          );
      }
  
  }
  
  // vim: et sw=4 sts=4