Commit:    20eb33b3212bd6c17d73c569c7345ae23c04d3ef
Author:    Moriyoshi Koizumi <m...@mozo.jp>         Sun, 10 Feb 2013 15:04:23 
+0900
Parents:   3d9a31efdfbbc3d73b8c94649f38035277264151
Branches:  PHP-5.5

Link:       
http://git.php.net/?p=php-src.git;a=commitdiff;h=20eb33b3212bd6c17d73c569c7345ae23c04d3ef

Log:
mb_split() can now handle empty matches like preg_split() does.

Changed paths:
  M  ext/mbstring/php_mbregex.c
  A  ext/mbstring/tests/mb_split_empty_match.phpt
  M  ext/mbstring/tests/mb_split_variation1.phpt


Diff:
diff --git a/ext/mbstring/php_mbregex.c b/ext/mbstring/php_mbregex.c
index a572bd4..145ee0c 100644
--- a/ext/mbstring/php_mbregex.c
+++ b/ext/mbstring/php_mbregex.c
@@ -1055,7 +1055,7 @@ PHP_FUNCTION(mb_split)
        php_mb_regex_t *re;
        OnigRegion *regs = NULL;
        char *string;
-       OnigUChar *pos;
+       OnigUChar *pos, *chunk_pos;
        int string_len;
 
        int n, err;
@@ -1065,8 +1065,8 @@ PHP_FUNCTION(mb_split)
                RETURN_FALSE;
        } 
 
-       if (count == 0) {
-               count = 1;
+       if (count > 0) {
+               count--;
        }
 
        /* create regex pattern buffer */
@@ -1076,31 +1076,30 @@ PHP_FUNCTION(mb_split)
 
        array_init(return_value);
 
-       pos = (OnigUChar *)string;
+       chunk_pos = pos = (OnigUChar *)string;
        err = 0;
        regs = onig_region_new();
        /* churn through str, generating array entries as we go */
-       while ((--count != 0) &&
-                  (err = onig_search(re, (OnigUChar *)string, (OnigUChar 
*)(string + string_len), pos, (OnigUChar *)(string + string_len), regs, 0)) >= 
0) {
-               if (regs->beg[0] == regs->end[0]) {
-                       php_error_docref(NULL TSRMLS_CC, E_WARNING, "Empty 
regular expression");
+       while (count != 0 && (pos - (OnigUChar *)string) < string_len) {
+               int beg, end;
+               err = onig_search(re, (OnigUChar *)string, (OnigUChar *)(string 
+ string_len), pos, (OnigUChar *)(string + string_len), regs, 0);
+               if (err < 0) {
                        break;
                }
-
+               beg = regs->beg[0], end = regs->end[0];
                /* add it to the array */
-               if (regs->beg[0] < string_len && regs->beg[0] >= (pos - 
(OnigUChar *)string)) {
-                       add_next_index_stringl(return_value, (char *)pos, 
((OnigUChar *)(string + regs->beg[0]) - pos), 1);
+               if ((pos - (OnigUChar *)string) < end) {
+                       if (beg < string_len && beg >= (chunk_pos - (OnigUChar 
*)string)) {
+                               add_next_index_stringl(return_value, (char 
*)chunk_pos, ((OnigUChar *)(string + beg) - chunk_pos), 1);
+                               --count;
+                       } else {
+                               err = -2;
+                               break;
+                       }
+                       /* point at our new starting point */
+                       chunk_pos = pos = (OnigUChar *)string + end;
                } else {
-                       err = -2;
-                       break;
-               }
-               /* point at our new starting point */
-               n = regs->end[0];
-               if ((pos - (OnigUChar *)string) < n) {
-                       pos = (OnigUChar *)string + n;
-               }
-               if (count < 0) {
-                       count = 0;
+                       pos++;
                }
                onig_region_free(regs, 0);
        }
@@ -1117,9 +1116,9 @@ PHP_FUNCTION(mb_split)
        }
 
        /* otherwise we just have one last element to add to the array */
-       n = ((OnigUChar *)(string + string_len) - pos);
+       n = ((OnigUChar *)(string + string_len) - chunk_pos);
        if (n > 0) {
-               add_next_index_stringl(return_value, (char *)pos, n, 1);
+               add_next_index_stringl(return_value, (char *)chunk_pos, n, 1);
        } else {
                add_next_index_stringl(return_value, "", 0, 1);
        }
diff --git a/ext/mbstring/tests/mb_split_empty_match.phpt 
b/ext/mbstring/tests/mb_split_empty_match.phpt
new file mode 100644
index 0000000..df3a22c
--- /dev/null
+++ b/ext/mbstring/tests/mb_split_empty_match.phpt
@@ -0,0 +1,23 @@
+--TEST--
+mb_split() empty match
+--
+--SKIPIF--
+<?php
+extension_loaded('mbstring') or die('skip');
+function_exists('mb_split') or die("skip mb_split() is not available in this 
build");
+?>
+--FILE--
+<?php
+mb_regex_set_options('m');
+var_dump(mb_split('^', "a\nb\nc"));
+--EXPECT--
+array(3) {
+  [0]=>
+  string(2) "a
+"
+  [1]=>
+  string(2) "b
+"
+  [2]=>
+  string(1) "c"
+}
diff --git a/ext/mbstring/tests/mb_split_variation1.phpt 
b/ext/mbstring/tests/mb_split_variation1.phpt
index be3230e..b508049 100644
--- a/ext/mbstring/tests/mb_split_variation1.phpt
+++ b/ext/mbstring/tests/mb_split_variation1.phpt
@@ -156,16 +156,12 @@ array(1) {
 }
 
 -- Iteration 10 --
-
-Warning: mb_split(): Empty regular expression in %s on line %d
 array(1) {
   [0]=>
   string(13) "a b c d e f g"
 }
 
 -- Iteration 11 --
-
-Warning: mb_split(): Empty regular expression in %s on line %d
 array(1) {
   [0]=>
   string(13) "a b c d e f g"
@@ -178,8 +174,6 @@ array(1) {
 }
 
 -- Iteration 13 --
-
-Warning: mb_split(): Empty regular expression in %s on line %d
 array(1) {
   [0]=>
   string(13) "a b c d e f g"
@@ -192,24 +186,18 @@ array(1) {
 }
 
 -- Iteration 15 --
-
-Warning: mb_split(): Empty regular expression in %s on line %d
 array(1) {
   [0]=>
   string(13) "a b c d e f g"
 }
 
 -- Iteration 16 --
-
-Warning: mb_split(): Empty regular expression in %s on line %d
 array(1) {
   [0]=>
   string(13) "a b c d e f g"
 }
 
 -- Iteration 17 --
-
-Warning: mb_split(): Empty regular expression in %s on line %d
 array(1) {
   [0]=>
   string(13) "a b c d e f g"
@@ -240,16 +228,12 @@ array(1) {
 }
 
 -- Iteration 22 --
-
-Warning: mb_split(): Empty regular expression in %s on line %d
 array(1) {
   [0]=>
   string(13) "a b c d e f g"
 }
 
 -- Iteration 23 --
-
-Warning: mb_split(): Empty regular expression in %s on line %d
 array(1) {
   [0]=>
   string(13) "a b c d e f g"
@@ -259,4 +243,4 @@ array(1) {
 
 Warning: mb_split() expects parameter 1 to be string, resource given in %s on 
line %d
 bool(false)
-Done
\ No newline at end of file
+Done


--
PHP CVS Mailing List (http://www.php.net/)
To unsubscribe, visit: http://www.php.net/unsub.php

Reply via email to