Author: lupus
Date: 2007-10-26 13:29:26 -0400 (Fri, 26 Oct 2007)
New Revision: 88278
Modified:
trunk/mono/mono/metadata/ChangeLog
trunk/mono/mono/metadata/appdomain.c
trunk/mono/mono/metadata/string-icalls.c
trunk/mono/mono/metadata/string-icalls.h
Log:
Fri Oct 26 19:38:40 CEST 2007 Paolo Molaro <[EMAIL PROTECTED]>
* string-icalls.c, string-icalls.h, appdomain.c: patch from
Tyler Larson <[EMAIL PROTECTED]> to fix the handling of
RemoveEmptyEntries in the string.Split implementation (bug #322375).
Modified: trunk/mono/mono/metadata/ChangeLog
===================================================================
--- trunk/mono/mono/metadata/ChangeLog 2007-10-26 17:29:18 UTC (rev 88277)
+++ trunk/mono/mono/metadata/ChangeLog 2007-10-26 17:29:26 UTC (rev 88278)
@@ -1,3 +1,10 @@
+
+Fri Oct 26 19:38:40 CEST 2007 Paolo Molaro <[EMAIL PROTECTED]>
+
+ * string-icalls.c, string-icalls.h, appdomain.c: patch from
+ Tyler Larson <[EMAIL PROTECTED]> to fix the handling of
+ RemoveEmptyEntries in the string.Split implementation (bug #322375).
+
2007-10-26 Dick Porter <[EMAIL PROTECTED]>
* appdomain.c (MONO_CORLIB_VERSION): Bump version because of
Modified: trunk/mono/mono/metadata/appdomain.c
===================================================================
--- trunk/mono/mono/metadata/appdomain.c 2007-10-26 17:29:18 UTC (rev 88277)
+++ trunk/mono/mono/metadata/appdomain.c 2007-10-26 17:29:26 UTC (rev 88278)
@@ -44,7 +44,7 @@
#include <direct.h>
#endif
-#define MONO_CORLIB_VERSION 59
+#define MONO_CORLIB_VERSION 60
typedef struct
{
Modified: trunk/mono/mono/metadata/string-icalls.c
===================================================================
--- trunk/mono/mono/metadata/string-icalls.c 2007-10-26 17:29:18 UTC (rev 88277)
+++ trunk/mono/mono/metadata/string-icalls.c 2007-10-26 17:29:26 UTC (rev 88278)
@@ -97,8 +97,14 @@
memcpy(destptr, src + sindex, sizeof(gunichar2) * count);
}
+/* System.StringSplitOptions */
+typedef enum {
+ STRINGSPLITOPTIONS_NONE = 0,
+ STRINGSPLITOPTIONS_REMOVE_EMPTY_ENTRIES = 1
+} StringSplitOptions;
+
MonoArray *
-ves_icall_System_String_InternalSplit (MonoString *me, MonoArray *separator, gint32 count)
+ves_icall_System_String_InternalSplit (MonoString *me, MonoArray *separator, gint32 count, gint32 options)
{
MonoString * tmpstr;
MonoArray * retarr;
@@ -106,65 +112,134 @@
gint32 arrsize, srcsize, splitsize;
gint32 i, lastpos, arrpos;
gint32 tmpstrsize;
+ gint32 remempty;
+ gint32 flag;
gunichar2 *tmpstrptr;
- gunichar2 cmpchar;
+ remempty = options & STRINGSPLITOPTIONS_REMOVE_EMPTY_ENTRIES;
+ src = mono_string_chars (me);
+ srcsize = mono_string_length (me);
+ arrsize = mono_array_length (separator);
- MONO_ARCH_SAVE_REGS;
+ splitsize = 1;
+ /* Count the number of elements we will return. Note that this operation
+ * guarantees that we will return exactly splitsize elements, and we will
+ * have enough data to fill each. This allows us to skip some checks later on.
+ */
+ if (remempty == 0) {
+ for (i = 0; i != srcsize && splitsize < count; i++) {
+ if (string_icall_is_in_array (separator, arrsize, src [i]))
+ splitsize++;
+ }
+ } else if (count > 1) {
+ /* Require pattern "Nondelim + Delim + Nondelim" to increment counter.
+ * Lastpos != 0 means first nondelim found.
+ * Flag = 0 means last char was delim.
+ * Efficient, though perhaps confusing.
+ */
+ lastpos = 0;
+ flag = 0;
+ for (i = 0; i != srcsize && splitsize < count; i++) {
+ if (string_icall_is_in_array (separator, arrsize, src [i])) {
+ flag = 0;
+ } else if (flag == 0) {
+ if (lastpos == 1)
+ splitsize++;
+ flag = 1;
+ lastpos = 1;
+ }
+ }
- src = mono_string_chars(me);
- srcsize = mono_string_length(me);
- arrsize = mono_array_length(separator);
+ /* Nothing but separators */
+ if (lastpos == 0) {
+ retarr = mono_array_new (mono_domain_get (), mono_get_string_class (), 0);
+ return retarr;
+ }
+ }
- cmpchar = mono_array_get(separator, gunichar2, 0);
+ /* if no split chars found return the string */
+ if (splitsize == 1) {
+ if (remempty == 0 || count == 1) {
+ /* Copy the whole string */
+ retarr = mono_array_new (mono_domain_get (), mono_get_string_class (), 1);
+ mono_array_setref (retarr, 0, me);
+ } else {
+ /* otherwise we have to filter out leading & trailing delims */
- splitsize = 0;
- for (i = 0; i != srcsize && splitsize < count; i++) {
- if (string_icall_is_in_array(separator, arrsize, src[i]))
- splitsize++;
+ /* find first non-delim char */
+ for (; srcsize != 0; srcsize--, src++) {
+ if (!string_icall_is_in_array (separator, arrsize, src [0]))
+ break;
+ }
+ /* find last non-delim char */
+ for (; srcsize != 0; srcsize--) {
+ if (!string_icall_is_in_array (separator, arrsize, src [srcsize - 1]))
+ break;
+ }
+ tmpstr = mono_string_new_size (mono_domain_get (), srcsize);
+ tmpstrptr = mono_string_chars (tmpstr);
+
+ memcpy (tmpstrptr, src, srcsize * sizeof (gunichar2));
+ retarr = mono_array_new (mono_domain_get (), mono_get_string_class (), 1);
+ mono_array_setref (retarr, 0, tmpstr);
+ }
+ return retarr;
}
lastpos = 0;
arrpos = 0;
+
+ retarr = mono_array_new (mono_domain_get (), mono_get_string_class (), splitsize);
- /* if no split chars found return the string */
- if (splitsize == 0) {
- retarr = mono_array_new(mono_domain_get(), mono_get_string_class (), 1);
- mono_array_setref (retarr, 0, me);
+ for (i = 0; i != srcsize && arrpos != splitsize; i++) {
+ if (string_icall_is_in_array (separator, arrsize, src [i])) {
+
+ if (lastpos != i || remempty == 0) {
+ tmpstrsize = i - lastpos;
+ tmpstr = mono_string_new_size (mono_domain_get (), tmpstrsize);
+ tmpstrptr = mono_string_chars (tmpstr);
- return retarr;
- }
+ memcpy (tmpstrptr, src + lastpos, tmpstrsize * sizeof (gunichar2));
+ mono_array_setref (retarr, arrpos, tmpstr);
+ arrpos++;
- if (splitsize != count)
- splitsize++;
+ if (arrpos == splitsize - 1) {
+ /* Shortcut the last array element */
- retarr = mono_array_new(mono_domain_get(), mono_get_string_class (), splitsize);
- for (i = 0; i != srcsize && arrpos != count; i++) {
- if (string_icall_is_in_array(separator, arrsize, src[i])) {
- if (arrpos == count - 1)
- tmpstrsize = srcsize - lastpos;
- else
- tmpstrsize = i - lastpos;
+ lastpos = i + 1;
+ if (remempty != 0) {
+ /* Search for non-delim starting char (guaranteed to find one) Note that loop
+ * condition is only there for safety. It will never actually terminate the loop. */
+ for (; lastpos != srcsize ; lastpos++) {
+ if (!string_icall_is_in_array (separator, arrsize, src [lastpos]))
+ break;
+ }
+ if (count > splitsize) {
+ /* Since we have fewer results than our limit, we must remove
+ * trailing delimiters as well.
+ */
+ for (; srcsize != lastpos + 1 ; srcsize--) {
+ if (!string_icall_is_in_array (separator, arrsize, src [srcsize - 1]))
+ break;
+ }
+ }
+ }
- tmpstr = mono_string_new_size( mono_domain_get (), tmpstrsize);
- tmpstrptr = mono_string_chars(tmpstr);
+ tmpstrsize = srcsize - lastpos;
+ tmpstr = mono_string_new_size (mono_domain_get (), tmpstrsize);
+ tmpstrptr = mono_string_chars (tmpstr);
- memcpy(tmpstrptr, src + lastpos, tmpstrsize * sizeof(gunichar2));
- mono_array_setref (retarr, arrpos, tmpstr);
- arrpos++;
+ memcpy (tmpstrptr, src + lastpos, tmpstrsize * sizeof (gunichar2));
+ mono_array_setref (retarr, arrpos, tmpstr);
+
+ /* Loop will ALWAYS end here. Test criteria in the FOR loop is technically unnecessary. */
+ break;
+ }
+ }
lastpos = i + 1;
}
}
- if (arrpos < count) {
- tmpstrsize = srcsize - lastpos;
- tmpstr = mono_string_new_size( mono_domain_get (), tmpstrsize);
- tmpstrptr = mono_string_chars(tmpstr);
-
- memcpy(tmpstrptr, src + lastpos, tmpstrsize * sizeof(gunichar2));
- mono_array_setref (retarr, arrpos, tmpstr);
- }
-
return retarr;
}
Modified: trunk/mono/mono/metadata/string-icalls.h
===================================================================
--- trunk/mono/mono/metadata/string-icalls.h 2007-10-26 17:29:18 UTC (rev 88277)
+++ trunk/mono/mono/metadata/string-icalls.h 2007-10-26 17:29:26 UTC (rev 88278)
@@ -24,7 +24,7 @@
ves_icall_System_String_InternalCopyTo (MonoString *me, gint32 sindex, MonoArray *dest, gint32 dindex, gint32 count) MONO_INTERNAL;
MonoArray *
-ves_icall_System_String_InternalSplit (MonoString *me, MonoArray *separator, gint32 count) MONO_INTERNAL;
+ves_icall_System_String_InternalSplit (MonoString *me, MonoArray *separator, gint32 count, gint32 options) MONO_INTERNAL;
MonoString *
ves_icall_System_String_InternalTrim (MonoString *me, MonoArray *chars, gint32 typ) MONO_INTERNAL;
_______________________________________________
Mono-patches maillist - [email protected]
http://lists.ximian.com/mailman/listinfo/mono-patches