moriyoshi               Wed Mar  2 14:28:26 2005 EDT

  Added files:                 (Branch: PHP_5_0)
    /php-src/ext/xml/tests      bug32001.phpt 
  Log:
  - MFH
  
  
http://cvs.php.net/co.php/php-src/ext/xml/tests/bug32001.phpt?r=1.1&p=1
Index: php-src/ext/xml/tests/bug32001.phpt
+++ php-src/ext/xml/tests/bug32001.phpt
--TEST--
Bug #32001 (xml_parse*() goes into infinite loop when autodetection in effect)
--FILE--
<?php
/**
 * One scenario of the bug #32001 regression test.
 *
 * A scenario builds a small XML document whose element and attribute names
 * are Japanese, converts it from UTF-8 to the target encoding, optionally
 * prepends a byte order mark, feeds it to an XML parser created without an
 * explicit encoding, and prints either the collected start tags or the
 * parser error.
 */
class testcase {
        /** Target encoding name handed to iconv(). */
        private $encoding;
        /** Truthy when a byte order mark is prepended to the converted data. */
        private $bom;
        /** True when the document starts with an XML declaration. */
        private $prologue;
        /** Hex-encoded "name: attributes" strings gathered by start_element(). */
        private $tags;
        /** Bytes passed per xml_parse() call; 0 parses everything in one call. */
        private $chunk_size;

        /**
         * @param string $enc           target encoding of the document
         * @param int    $chunk_size    bytes per xml_parse() call, 0 for a single call
         * @param int    $bom           non-zero to prepend a byte order mark
         * @param int    $omit_prologue non-zero to leave out the XML declaration
         */
        function __construct($enc, $chunk_size = 0, $bom = 0, $omit_prologue = 0) {
                $this->encoding = $enc;
                $this->chunk_size = $chunk_size;
                $this->bom = $bom;
                $this->prologue = !$omit_prologue;
                $this->tags = array();
        }

        /**
         * Start-tag handler: records the element name and its attribute values.
         *
         * Everything is stored through bin2hex() so the printed result does
         * not depend on how the output itself is encoded.
         */
        function start_element($parser, $name, $attrs) {
                $attrs = array_map('bin2hex', $attrs);
                $this->tags[] = bin2hex($name).": ".implode(', ', $attrs);
        }

        /** End-tag handler: intentionally empty, only start tags are recorded. */
        function end_element($parser, $name) {
        }

        /**
         * Builds the document, parses it and prints the scenario report.
         *
         * Output is four header lines (encoding, prologue, chunk size, BOM)
         * followed by a var_dump() of the recorded tags on success or an
         * "[Error] ..." line on failure.
         */
        function run() {
                $data = '';

                if ($this->prologue) {
                        // The declaration carries the encoding name without its BE/LE suffix.
                        $canonical_name = preg_replace('/BE|LE/i', '', $this->encoding);
                        $data .= "<?xml version=\"1.0\" encoding=\"$canonical_name\" ?>\n";
                }

                $data .= <<<HERE
<テスト:テスト1 xmlns:テスト="http://www.example.com/テスト/" テスト="テスト">
  <テスト:テスト2 テスト="テスト">
        <テスト:テスト3>
          test!
        </テスト:テスト3>
  </テスト:テスト2>
</テスト:テスト1>
HERE;

                $data = iconv("UTF-8", $this->encoding, $data);

                if ($this->bom) {
                        switch (strtoupper($this->encoding)) {
                                case 'UTF-8':
                                case 'UTF8':
                                        $data = "\xef\xbb\xbf".$data;
                                        break;

                                case 'UTF-16':
                                case 'UTF16':
                                case 'UTF-16BE':
                                case 'UTF16BE':
                                case 'UCS-2':
                                case 'UCS2':
                                case 'UCS-2BE':
                                case 'UCS2BE':
                                        $data = "\xfe\xff".$data;
                                        break;

                                case 'UTF-16LE':
                                case 'UTF16LE':
                                case 'UCS-2LE':
                                case 'UCS2LE':
                                        $data = "\xff\xfe".$data;
                                        break;

                                case 'UTF-32':
                                case 'UTF32':
                                case 'UTF-32BE':
                                case 'UTF32BE':
                                case 'UCS-4':
                                case 'UCS4':
                                case 'UCS-4BE':
                                case 'UCS4BE':
                                        $data = "\x00\x00\xfe\xff".$data;
                                        break;

                                case 'UTF-32LE':
                                case 'UTF32LE':
                                case 'UCS-4LE':
                                case 'UCS4LE':
                                        $data = "\xff\xfe\x00\x00".$data;
                                        break;
                        }
                }

                // No encoding is given, so the parser has to detect it from the data.
                $parser = xml_parser_create(NULL);
                // Object/method callables bind the handlers to this instance
                // directly, without a separate xml_set_object() call.
                xml_set_element_handler($parser,
                                array($this, 'start_element'),
                                array($this, 'end_element'));

                if ($this->chunk_size == 0) {
                        $success = @xml_parse($parser, $data, true);
                } else {
                        $length = strlen($data);
                        for ($offset = 0; $offset < $length;
                                        $offset += $this->chunk_size) {
                                $success = @xml_parse($parser,
                                                substr($data, $offset, $this->chunk_size), false);
                                if (!$success) {
                                        break;
                                }
                        }
                        if ($success) {
                                // An empty final chunk tells the parser the input is complete.
                                $success = @xml_parse($parser, "", true);
                        }
                }

                echo "Encoding: $this->encoding\n";
                echo "XML Prologue: ".($this->prologue ? 'present': 'not present'), "\n";
                echo "Chunk size: ".($this->chunk_size ? "$this->chunk_size byte(s)\n": "all data at once\n");
                echo "BOM: ".($this->bom ? 'prepended': 'not prepended'), "\n";

                if ($success) {
                        var_dump($this->tags);
                } else {
                        echo "[Error] ",
                                xml_error_string(xml_get_error_code($parser)), "\n";
                }
        }
}
// Scenario matrix. Arguments follow the testcase constructor:
// encoding, chunk size (0 = whole document in one call), BOM flag,
// omit-prologue flag.
$suite = array(
        new testcase("UTF-8",     0, 0, 0),
        new testcase("UTF-8",     0, 0, 1),
        new testcase("UTF-8",     0, 1, 0),
        new testcase("UTF-8",     0, 1, 1),
        new testcase("UTF-16BE",  0, 0, 0),
        new testcase("UTF-16BE",  0, 1, 0),
        new testcase("UTF-16BE",  0, 1, 1),
        new testcase("UTF-16LE",  0, 0, 0),
        new testcase("UTF-16LE",  0, 1, 0),
        new testcase("UTF-16LE",  0, 1, 1),
        new testcase("UTF-8",     1, 0, 0),
        new testcase("UTF-8",     1, 0, 1),
        new testcase("UTF-8",     1, 1, 0),
        new testcase("UTF-8",     1, 1, 1),
        new testcase("UTF-16BE",  1, 0, 0),
        new testcase("UTF-16BE",  1, 1, 0),
        new testcase("UTF-16BE",  1, 1, 1),
        new testcase("UTF-16LE",  1, 0, 0),
        new testcase("UTF-16LE",  1, 1, 0),
        new testcase("UTF-16LE",  1, 1, 1),
        new testcase("EUC-JP"  ,  0),
        new testcase("EUC-JP"  ,  1),
        new testcase("Shift_JIS", 0),
        new testcase("Shift_JIS", 1),
        new testcase("GB2312",    0),
        new testcase("GB2312",    1),
);

// Locate the PHP binary named by TEST_PHP_EXECUTABLE (presumably exported
// by the test runner - confirm). getenv() is tried first because $_ENV is
// only populated when variables_order contains "E".
$php_binary = getenv('TEST_PHP_EXECUTABLE');
if (($php_binary === false || $php_binary === '') && !empty($_ENV['TEST_PHP_EXECUTABLE'])) {
        $php_binary = $_ENV['TEST_PHP_EXECUTABLE'];
}

// Ask that binary for its phpinfo text; the path is escaped so that spaces
// or shell metacharacters in it cannot alter the command.
$phpinfo = '';
if (is_string($php_binary) && $php_binary !== '') {
        $phpinfo = (string) shell_exec(escapeshellarg($php_binary) . ' -i');
}

// Print the "libxml2 Version => ..." line; an empty line is printed when
// it cannot be found, so the scenario reports still follow.
$match = array();
preg_match("/^libxml2 Version.*\$/im", $phpinfo, $match);

echo isset($match[0]) ? $match[0] : '', "\n";


foreach ($suite as $testcase) {
        $testcase->run();
}

// vim600: sts=4 sw=4 ts=4 encoding=UTF-8
?>
--EXPECTF--
libxml2 Version => %s
Encoding: UTF-8
XML Prologue: present
Chunk size: all data at once
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-8
XML Prologue: not present
Chunk size: all data at once
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-8
XML Prologue: present
Chunk size: all data at once
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-8
XML Prologue: not present
Chunk size: all data at once
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16BE
XML Prologue: present
Chunk size: all data at once
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16BE
XML Prologue: present
Chunk size: all data at once
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16BE
XML Prologue: not present
Chunk size: all data at once
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16LE
XML Prologue: present
Chunk size: all data at once
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16LE
XML Prologue: present
Chunk size: all data at once
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16LE
XML Prologue: not present
Chunk size: all data at once
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-8
XML Prologue: present
Chunk size: 1 byte(s)
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-8
XML Prologue: not present
Chunk size: 1 byte(s)
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-8
XML Prologue: present
Chunk size: 1 byte(s)
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-8
XML Prologue: not present
Chunk size: 1 byte(s)
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16BE
XML Prologue: present
Chunk size: 1 byte(s)
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16BE
XML Prologue: present
Chunk size: 1 byte(s)
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16BE
XML Prologue: not present
Chunk size: 1 byte(s)
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16LE
XML Prologue: present
Chunk size: 1 byte(s)
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16LE
XML Prologue: present
Chunk size: 1 byte(s)
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: UTF-16LE
XML Prologue: not present
Chunk size: 1 byte(s)
BOM: prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: EUC-JP
XML Prologue: present
Chunk size: all data at once
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: EUC-JP
XML Prologue: present
Chunk size: 1 byte(s)
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: Shift_JIS
XML Prologue: present
Chunk size: all data at once
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: Shift_JIS
XML Prologue: present
Chunk size: 1 byte(s)
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: GB2312
XML Prologue: present
Chunk size: all data at once
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}
Encoding: GB2312
XML Prologue: present
Chunk size: 1 byte(s)
BOM: not prepended
array(3) {
  [0]=>
  string(128) "e38386e382b9e383883ae38386e382b9e3838831: 687474703a2f2f7777772e6578616d706c652e636f6d2fe38386e382b9e383882f, e38386e382b9e38388"
  [1]=>
  string(60) "e38386e382b9e383883ae38386e382b9e3838832: e38386e382b9e38388"
  [2]=>
  string(42) "e38386e382b9e383883ae38386e382b9e3838833: "
}

-- 
PHP CVS Mailing List (http://www.php.net/)
To unsubscribe, visit: http://www.php.net/unsub.php

Reply via email to