--TEST--
Bug #32001 (xml_parse*() goes into infinite loop when autodetection in effect), using EUC-JP, Shift_JIS, GB2312
--SKIPIF--
<?php
// run() relies on ext/xml for parsing and on iconv() to transcode the fixture.
if (!extension_loaded('xml')) die('skip xml extension not loaded');
if (!extension_loaded('iconv')) die('skip iconv extension not loaded');
foreach (array('EUC-JP', 'Shift_JIS', 'GB2312') as $encoding) {
    if (@iconv('UTF-8', $encoding, 'test') === false) {
        die("skip iconv does not support $encoding");
    }
}
?>
--FILE--
<?php
/**
 * One parse scenario: a fixed UTF-8 XML fixture is transcoded to $encoding,
 * fed to an autodetecting XML parser (whole or in fixed-size chunks), and the
 * element names / attribute values seen by the SAX handlers are dumped as hex.
 */
class testcase {
    private $encoding;
    private $chunk_size;
    private $bom;
    private $prologue;
    private $tags;

    /**
     * @param string $enc           Target encoding name passed to iconv().
     * @param int    $chunk_size    Bytes per xml_parse() call; 0 feeds all data at once.
     * @param mixed  $bom           Reported in the "BOM:" line; run() does not prepend a BOM.
     * @param mixed  $omit_prologue Truthy to leave out the XML declaration.
     */
    public function __construct($enc, $chunk_size = 0, $bom = 0, $omit_prologue = 0) {
        $this->encoding = $enc;
        $this->chunk_size = $chunk_size;
        $this->bom = $bom;
        $this->prologue = !$omit_prologue;
        $this->tags = array();
    }

    /**
     * Start-tag handler: records "hex(name): hex(attr1), hex(attr2), ...".
     * Hex is used so the expected output stays pure ASCII.
     */
    public function start_element($parser, $name, $attrs) {
        $attrs = array_map('bin2hex', $attrs);
        $this->tags[] = bin2hex($name).": ".implode(', ', $attrs);
    }

    /** End-tag handler: intentionally does nothing. */
    public function end_element($parser, $name) {
    }

    /**
     * Builds the document, parses it, and prints the scenario description
     * followed by either the collected tags or the parser's error string.
     */
    public function run() {
        $data = '';

        if ($this->prologue) {
            // Drop any BE/LE marker from the name before announcing it in the declaration.
            $canonical_name = preg_replace('/BE|LE/i', '', $this->encoding);
            $data .= "<?xml version=\"1.0\" encoding=\"$canonical_name\" ?>\n";
        }

        // The root element's two attribute values (namespace URI, then テスト) are
        // what the first entry of each expected dump encodes.
        $data .= <<<HERE
<テスト:テスト1 xmlns:テスト="http://www.example.com/テスト/" テスト="テスト">
  <テスト:テスト2 テスト="テスト">
    <テスト:テスト3>
      test!
    </テスト:テスト3>
  </テスト:テスト2>
</テスト:テスト1>
HERE;

        $data = iconv("UTF-8", $this->encoding, $data);

        // NULL input encoding: the parser has to detect the encoding itself.
        $parser = xml_parser_create(NULL);
        xml_parser_set_option($parser, XML_OPTION_CASE_FOLDING, 0);
        // Object callables replace xml_set_object() + method-name strings.
        xml_set_element_handler(
            $parser,
            array($this, 'start_element'),
            array($this, 'end_element')
        );

        // Warnings are suppressed on purpose; failures are reported through
        // xml_error_string() below so the output stays stable.
        if ($this->chunk_size == 0) {
            $success = @xml_parse($parser, $data, true);
        } else {
            $success = true;
            $length = strlen($data);
            for ($offset = 0; $offset < $length; $offset += $this->chunk_size) {
                $success = @xml_parse($parser, substr($data, $offset, $this->chunk_size), false);
                if (!$success) {
                    break;
                }
            }
            if ($success) {
                // Empty final chunk tells the parser the document is complete.
                $success = @xml_parse($parser, "", true);
            }
        }

        echo "Encoding: $this->encoding\n";
        echo "XML Prologue: ".($this->prologue ? 'present': 'not present'), "\n";
        echo "Chunk size: ".($this->chunk_size ? "$this->chunk_size byte(s)\n": "all data at once\n");
        echo "BOM: ".($this->bom ? 'prepended': 'not prepended'), "\n";

        if ($success) {
            var_dump($this->tags);
        } else {
            echo "[Error] ", xml_error_string(xml_get_error_code($parser)), "\n";
        }
    }
}

// Each encoding is parsed twice: in one call, and one byte at a time.
$suite = array(
    new testcase("EUC-JP"   , 0),
    new testcase("EUC-JP"   , 1),
    new testcase("Shift_JIS", 0),
    new testcase("Shift_JIS", 1),
    new testcase("GB2312",    0),
    new testcase("GB2312",    1),
);

// Informational line only; EXPECTF matches it with %s.
if (XML_SAX_IMPL == 'libxml') {
    echo "libxml2 Version => ", LIBXML_DOTTED_VERSION, "\n";
} else {
    echo "libxml2 Version => NONE\n";
}

foreach ($suite as $testcase) {
    $testcase->run();
}

// vim600: sts=4 sw=4 ts=4 encoding=UTF-8
?>
--EXPECTF--
libxml2 Version => %s
Encoding: EUC-JP
XML Prologue: present
Chunk size: all data at once
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: EUC-JP
XML Prologue: present
Chunk size: 1 byte(s)
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: Shift_JIS
XML Prologue: present
Chunk size: all data at once
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: Shift_JIS
XML Prologue: present
Chunk size: 1 byte(s)
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: GB2312
XML Prologue: present
Chunk size: all data at once
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: GB2312
XML Prologue: present
Chunk size: 1 byte(s)
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}