Hello all.
Attached is the patch which adds Unicode support to *printf() functions stack.
We (Andrei and me) made several assumptions that are worth mentioning:
sprintf() and vsprintf():
- use runtime_encoding when dealing with Unicode data.
printf() and vprintf():
- the result data is converted to output_encoding when formatting is done;
- return _number of bytes_ outputted.
fprintf() and vfprintf():
- use runtime_encoding, as all conversions are done by underlying streams API;
- both functions return the number returned by streams API (which seems to be
number of bytes).
I did not run any benchmarks yet, but I don't expect it to cause any major
slowdown.
I would like to hear your comments before applying the patch, so don't hesitate
to post them.
--
Wbr,
Antony Dovgal
Index: ext/standard/formatted_print.c
===================================================================
RCS file: /repository/php-src/ext/standard/formatted_print.c,v
retrieving revision 1.88
diff -u -p -d -r1.88 formatted_print.c
--- ext/standard/formatted_print.c 7 Dec 2006 20:45:21 -0000 1.88
+++ ext/standard/formatted_print.c 11 Dec 2006 22:44:21 -0000
@@ -40,6 +40,9 @@
#define MAX_FLOAT_DIGITS 38
#define MAX_FLOAT_PRECISION 40
+#define PHP_OUTPUT 0
+#define PHP_RUNTIME 1
+
#if 0
/* trick to control varargs functions through cpp */
# define PRINTF_DEBUG(arg) php_printf arg
@@ -50,7 +53,10 @@
static char hexchars[] = "0123456789abcdef";
static char HEXCHARS[] = "0123456789ABCDEF";
+static UChar u_hexchars[] = {0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37,
0x38, 0x39, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66};
+static UChar u_HEXCHARS[] = {0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37,
0x38, 0x39, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46};
+/* php_sprintf_appendchar() {{{ */
inline static void
php_sprintf_appendchar(char **buffer, int *pos, int *size, char add TSRMLS_DC)
{
@@ -62,8 +68,21 @@ php_sprintf_appendchar(char **buffer, in
PRINTF_DEBUG(("sprintf: appending '%c', pos=\n", add, *pos));
(*buffer)[(*pos)++] = add;
}
+/* }}} */
+/* php_u_sprintf_appendchar() {{{ */
+inline static void
+php_u_sprintf_appendchar(UChar **buffer, int *pos, int *size, UChar add
TSRMLS_DC)
+{
+ if ((*pos + 1) >= *size) {
+ *size <<= 1;
+ *buffer = eurealloc(*buffer, *size);
+ }
+ (*buffer)[(*pos)++] = add;
+}
+/* }}} */
+/* php_sprintf_appendstring() {{{ */
inline static void
php_sprintf_appendstring(char **buffer, int *pos, int *size, char *add,
int min_width, int
max_width, char padding,
@@ -112,10 +131,57 @@ php_sprintf_appendstring(char **buffer,
}
}
}
+/* }}} */
+/* php_u_sprintf_appendstring() {{{ */
+inline static void
+php_u_sprintf_appendstring(UChar **buffer, int *pos, int *size, UChar *add,
+ int min_width, int
max_width, UChar padding,
+ int alignment, int len, int
neg, int expprec, int always_sign)
+{
+ register int npad;
+ int req_size;
+ int copy_len;
+
+ copy_len = (expprec ? MIN(max_width, len) : len);
+ npad = min_width - copy_len;
+
+ if (npad < 0) {
+ npad = 0;
+ }
+
+ req_size = *pos + MAX(min_width, copy_len) + 1;
+
+ if (req_size > *size) {
+ while (req_size > *size) {
+ *size <<= 1;
+ }
+ *buffer = eurealloc(*buffer, *size);
+ }
+ if (alignment == ALIGN_RIGHT) {
+ if ((neg || always_sign) && padding == 0x30 /* '0' */) {
+ (*buffer)[(*pos)++] = (neg) ? 0x2D /* '-' */ : 0x2B /*
'+' */;
+ add++;
+ len--;
+ copy_len--;
+ }
+ while (npad-- > 0) {
+ (*buffer)[(*pos)++] = padding;
+ }
+ }
+ u_memcpy(&(*buffer)[*pos], add, copy_len + 1);
+ *pos += copy_len;
+ if (alignment == ALIGN_LEFT) {
+ while (npad--) {
+ (*buffer)[(*pos)++] = padding;
+ }
+ }
+}
+/* }}} */
+/* php_sprintf_appendint() {{{ */
inline static void
-php_sprintf_appendint(char **buffer, int *pos, int *size, long number,
+php_sprintf_appendint(char **buffer, int *pos, int *size, long number,
int width, char padding, int
alignment,
int always_sign)
{
@@ -155,7 +221,49 @@ php_sprintf_appendint(char **buffer, int
padding, alignment,
(NUM_BUF_SIZE - 1) - i,
neg, 0, always_sign);
}
+/* }}} */
+/* php_u_sprintf_appendint() {{{ */
+inline static void
+php_u_sprintf_appendint(UChar **buffer, int *pos, int *size, long number,
+ int width, UChar padding, int
alignment,
+ int always_sign)
+{
+ UChar numbuf[NUM_BUF_SIZE];
+ register unsigned long magn, nmagn;
+ register unsigned int i = NUM_BUF_SIZE - 1, neg = 0;
+
+ if (number < 0) {
+ neg = 1;
+ magn = ((unsigned long) -(number + 1)) + 1;
+ } else {
+ magn = (unsigned long) number;
+ }
+
+ /* Can't right-pad 0's on integers */
+ if (alignment==0 && padding== 0x30 /* '0' */) padding = 0x20 /* ' ' */;
+
+ numbuf[i] = 0x0A /* '\0' */;
+
+ do {
+ nmagn = magn / 10;
+
+ numbuf[--i] = (UChar)(magn - (nmagn * 10)) + 0x30 /* '0' */;
+ magn = nmagn;
+ }
+ while (magn > 0 && i > 0);
+ if (neg) {
+ numbuf[--i] = 0x2D /* '-' */;
+ } else if (always_sign) {
+ numbuf[--i] = 0x2B /* '+' */;
+ }
+ php_u_sprintf_appendstring(buffer, pos, size, &numbuf[i], width, 0,
+ padding, alignment,
(NUM_BUF_SIZE - 1) - i,
+ neg, 0, always_sign);
+}
+/* }}} */
+
+/* php_sprintf_appenduint() {{{ */
inline static void
php_sprintf_appenduint(char **buffer, int *pos, int *size,
unsigned long number,
@@ -185,7 +293,38 @@ php_sprintf_appenduint(char **buffer, in
php_sprintf_appendstring(buffer, pos, size, &numbuf[i], width, 0,
padding, alignment,
(NUM_BUF_SIZE - 1) - i, 0, 0, 0);
}
+/* }}} */
+/* php_u_sprintf_appenduint() {{{ */
+inline static void
+php_u_sprintf_appenduint(UChar **buffer, int *pos, int *size,
+ unsigned long number,
+ int width, UChar padding, int
alignment)
+{
+ UChar numbuf[NUM_BUF_SIZE];
+ register unsigned long magn, nmagn;
+ register unsigned int i = NUM_BUF_SIZE - 1;
+
+ magn = (unsigned int) number;
+
+ /* Can't right-pad 0's on integers */
+ if (alignment == 0 && padding == 0x30 /* '0' */) padding = 0x20 /* ' '
*/;
+
+ numbuf[i] = 0x0A /* '\0' */;
+
+ do {
+ nmagn = magn / 10;
+
+ numbuf[--i] = (UChar)(magn - (nmagn * 10)) + 0x30 /* '0' */;
+ magn = nmagn;
+ } while (magn > 0 && i > 0);
+
+ php_u_sprintf_appendstring(buffer, pos, size, &numbuf[i], width, 0,
+ padding, alignment,
(NUM_BUF_SIZE - 1) - i, 0, 0, 0);
+}
+/* }}} */
+
+/* php_sprintf_appenddouble() {{{ */
inline static void
php_sprintf_appenddouble(char **buffer, int *pos,
int *size, double number,
@@ -231,7 +370,7 @@ php_sprintf_appenddouble(char **buffer,
}
case 'E':
case 'f':
- s = ap_php_conv_fp(fmt, number, 0, precision,
+ s = ap_php_conv_fp(fmt, number, NO, precision,
&is_negative, &num_buf[1],
&s_len);
if (is_negative) {
num_buf[0] = '-';
@@ -272,8 +411,122 @@ php_sprintf_appenddouble(char **buffer,
php_sprintf_appendstring(buffer, pos, size, s, width, 0, padding,
alignment, s_len,
is_negative, 0, always_sign);
}
+/* }}} */
+
+/* php_u_sprintf_appenddouble() {{{ */
+inline static void
+php_u_sprintf_appenddouble(UChar **buffer, int *pos,
+ int *size, double number,
+ int width, UChar padding,
+ int alignment, int precision,
+ int adjust, UChar fmt,
+ int always_sign
+ TSRMLS_DC)
+{
+ char num_buf[NUM_BUF_SIZE];
+ char *s = NULL, *q, s_fmt;
+ UChar *uni_s;
+ int s_len = 0, is_negative = 0;
+
+ if ((adjust & ADJ_PRECISION) == 0) {
+ precision = FLOAT_PRECISION;
+ } else if (precision > MAX_FLOAT_PRECISION) {
+ precision = MAX_FLOAT_PRECISION;
+ }
+
+ if (zend_isnan(number)) {
+ UChar *nan = USTR_MAKE("NaN");
+ is_negative = (number<0);
+ php_u_sprintf_appendstring(buffer, pos, size, nan, 3, 0,
padding,
+ alignment,
precision, is_negative, 0, always_sign);
+ efree(nan);
+ return;
+ }
+
+ if (zend_isinf(number)) {
+ UChar *inf = USTR_MAKE("INF");
+ is_negative = (number<0);
+ php_u_sprintf_appendstring(buffer, pos, size, inf, 3, 0,
padding,
+ alignment,
precision, is_negative, 0, always_sign);
+ efree(inf);
+ return;
+ }
+
+ switch (fmt) {
+ case 0x66 /* 'f' */:
+ case 0x46 /* 'F' */:
+ s_fmt = 'f';
+ break;
+ case 0x65 /* 'e' */:
+ s_fmt = 'e';
+ break;
+ case 0x45 /* 'E' */:
+ s_fmt = 'E';
+ break;
+ case 0x67 /* 'g' */:
+ s_fmt = 'g';
+ break;
+ case 0x47 /* 'G' */:
+ s_fmt = 'G';
+ break;
+ }
+
+ switch (fmt) {
+ case 0x46 /* 'F' */:
+ /* break is missing */
+ case 0x65 /* 'e' */:
+ if (precision) {
+ precision--;
+ }
+ case 0x45 /* 'E' */:
+ case 0x66 /* 'f' */:
+ s = ap_php_conv_fp(s_fmt, number, NO, precision,
+ &is_negative, &num_buf[1],
&s_len);
+ if (is_negative) {
+ num_buf[0] = '-';
+ s = num_buf;
+ s_len++;
+ } else if (always_sign) {
+ num_buf[0] = '+';
+ s = num_buf;
+ s_len++;
+ }
+ s[s_len] = '\0';
+ break;
+
+ case 0x67 /* 'g' */:
+ case 0x47 /* 'G' */:
+ if (precision == 0)
+ precision = 1;
+ /*
+ * * We use &num_buf[ 1 ], so that we have room for the
sign
+ */
+ s = bsd_gcvt(number, precision, &num_buf[1]);
+ is_negative = 0;
+ if (*s == '-') {
+ is_negative = 1;
+ s = &num_buf[1];
+ } else if (always_sign) {
+ num_buf[0] = '+';
+ s = num_buf;
+ }
+
+ s_len = strlen(s);
+
+ if (fmt == 0x47 /* 'G' */ && (q = strchr(s, 'e')) !=
NULL) {
+ *q = 'E';
+ }
+ break;
+ }
+ uni_s = zend_ascii_to_unicode(s, s_len + 1 ZEND_FILE_LINE_CC);
+ php_u_sprintf_appendstring(buffer, pos, size, uni_s, width, 0, padding,
+ alignment, s_len,
is_negative, 0, always_sign);
+ efree(uni_s);
+}
+/* }}} */
+/* php_sprintf_append2n() {{{ */
inline static void
php_sprintf_append2n(char **buffer, int *pos, int *size, long number,
int width, char padding, int
alignment, int n,
@@ -302,8 +555,35 @@ php_sprintf_append2n(char **buffer, int
padding, alignment,
(NUM_BUF_SIZE - 1) - i,
0, expprec, 0);
}
+/* }}} */
+/* php_u_sprintf_append2n() {{{ */
+inline static void
+php_u_sprintf_append2n(UChar **buffer, int *pos, int *size, long number,
+ int width, UChar padding, int
alignment, int n,
+ UChar *chartable, int expprec)
+{
+ UChar numbuf[NUM_BUF_SIZE];
+ register unsigned long num;
+ register unsigned int i = NUM_BUF_SIZE - 1;
+ register int andbits = (1 << n) - 1;
+ num = (unsigned long) number;
+ numbuf[i] = '\0';
+
+ do {
+ numbuf[--i] = chartable[(num & andbits)];
+ num >>= n;
+ }
+ while (num > 0);
+
+ php_u_sprintf_appendstring(buffer, pos, size, &numbuf[i], width, 0,
+ padding, alignment,
(NUM_BUF_SIZE - 1) - i,
+ 0, expprec, 0);
+}
+/* }}} */
+
+/* php_sprintf_getnumber() {{{ */
inline static long
php_sprintf_getnumber(char *buffer, int *pos)
{
@@ -318,8 +598,25 @@ php_sprintf_getnumber(char *buffer, int
*pos += i;
return num;
}
+/* }}} */
-/* {{{ php_formatted_print
+/* php_u_sprintf_getnumber() {{{ */
+inline static long
+php_u_sprintf_getnumber(UChar *buffer, int *pos)
+{
+ UChar *endptr;
+ register long num = zend_u_strtol(&buffer[*pos], &endptr, 10);
+ register int i = 0;
+
+ if (endptr != NULL) {
+ i = (endptr - &buffer[*pos]);
+ }
+ *pos += i;
+ return num;
+}
+/* }}} */
+
+/* {{{ php_formatted_print()
* New sprintf implementation for PHP.
*
* Modifiers:
@@ -343,8 +640,7 @@ php_sprintf_getnumber(char *buffer, int
* "X" integer argument is printed as uppercase hexadecimal
*
*/
-static char *
-php_formatted_print(int ht, int *len, int use_array, int format_offset
TSRMLS_DC)
+static char * php_formatted_print(int ht, int *len, int use_array, int
format_offset, int type TSRMLS_DC)
{
zval ***args, **z_format;
int argc, size = 240, inpos = 0, outpos = 0, temppos;
@@ -518,9 +814,26 @@ php_formatted_print(int ht, int *len, in
switch (format[inpos]) {
case 's': {
zval *var, var_copy;
- int use_copy;
+ int use_copy = 0;
- zend_make_printable_zval(tmp,
&var_copy, &use_copy);
+ if (Z_TYPE_P(tmp) != IS_UNICODE) {
+ zend_make_printable_zval(tmp,
&var_copy, &use_copy);
+ } else {
+ var_copy = *tmp;
+ zval_copy_ctor(&var_copy);
+ INIT_PZVAL(&var_copy);
+ use_copy = 1;
+
+ switch (type) {
+ case PHP_OUTPUT:
+
convert_to_string_with_converter(&var_copy,
ZEND_U_CONVERTER(UG(output_encoding_conv)));
+ break;
+ case PHP_RUNTIME:
+ default:
+
convert_to_string_with_converter(&var_copy,
ZEND_U_CONVERTER(UG(runtime_encoding_conv)));
+ break;
+ }
+ }
if (use_copy) {
var = &var_copy;
} else {
@@ -559,7 +872,6 @@ php_formatted_print(int ht, int *len, in
case 'E':
case 'f':
case 'F':
- /* XXX not done */
convert_to_double(tmp);
php_sprintf_appenddouble(&result,
&outpos, &size,
Z_DVAL_P(tmp),
@@ -630,17 +942,323 @@ php_formatted_print(int ht, int *len, in
}
/* }}} */
+/* php_u_formatted_print() {{{ */
+static zstr php_u_formatted_print(int ht, int *len, int use_array, int
format_offset, int type TSRMLS_DC)
+{
+ zval ***args, **z_format;
+ int argc, size = 240, inpos = 0, outpos = 0, temppos;
+ int alignment, width, precision, currarg, adjusting, argnum;
+ UChar *format, *result, padding;
+ int always_sign;
+ zstr result_str;
+
+ argc = ZEND_NUM_ARGS();
+
+ /* verify the number of args */
+ if ((use_array && argc != (2 + format_offset))
+ || (!use_array && argc < (1 + format_offset))) {
+ WRONG_PARAM_COUNT_WITH_RETVAL(NULL_ZSTR);
+ }
+ args = (zval ***)safe_emalloc(argc, sizeof(zval *), 0);
+
+ if (zend_get_parameters_array_ex(argc, args) == FAILURE) {
+ efree(args);
+ WRONG_PARAM_COUNT_WITH_RETVAL(NULL_ZSTR);
+ }
+
+ if (use_array) {
+ int i = 1;
+ zval ***newargs;
+ zval **array;
+
+ z_format = args[format_offset];
+ array = args[1 + format_offset];
+
+ SEPARATE_ZVAL(array);
+ convert_to_array_ex(array);
+
+ argc = 1 + zend_hash_num_elements(Z_ARRVAL_PP(array));
+ newargs = (zval ***)safe_emalloc(argc, sizeof(zval *), 0);
+ newargs[0] = z_format;
+
+ for (zend_hash_internal_pointer_reset(Z_ARRVAL_PP(array));
+ zend_hash_get_current_data(Z_ARRVAL_PP(array), (void
**)&newargs[i++]) == SUCCESS;
+ zend_hash_move_forward(Z_ARRVAL_PP(array)));
+
+ efree(args);
+ args = newargs;
+ format_offset = 0;
+ }
+
+ convert_to_unicode_ex(args[format_offset]);
+ format = Z_USTRVAL_PP(args[format_offset]);
+ result = eumalloc(size);
+
+ currarg = 1;
+
+ while (inpos<Z_USTRLEN_PP(args[format_offset])) {
+ int expprec = 0, multiuse = 0;
+ zval *tmp;
+
+ if (format[inpos] != 0x25 /* '%' */) {
+ php_u_sprintf_appendchar(&result, &outpos, &size,
format[inpos++] TSRMLS_CC);
+ } else if (format[inpos + 1] == 0x25 /* '%' */) {
+ php_u_sprintf_appendchar(&result, &outpos, &size, 0x25
/* '%' */ TSRMLS_CC);
+ inpos += 2;
+ } else {
+ /* starting a new format specifier, reset variables */
+ alignment = ALIGN_RIGHT;
+ adjusting = 0;
+ padding = 0x20 /* ' ' */;
+ always_sign = 0;
+ inpos++; /* skip the '%' */
+
+ if ((format[inpos] < 0x7f) &&
!u_isalpha(format[inpos])) {
+ /* first look for argnum */
+ temppos = inpos;
+ while (format[temppos] >= 0x30 /* '0' */ &&
format[temppos] <= 0x39 /* '9' */) temppos++;
+ if (format[temppos] == 0x24 /* '$' */) {
+ argnum =
php_u_sprintf_getnumber(format, &inpos);
+
+ if (argnum == 0) {
+ efree(result);
+ efree(args);
+ php_error_docref(NULL
TSRMLS_CC, E_WARNING, "Zero is not a valid argument number");
+ return NULL_ZSTR;
+ }
+
+ multiuse = 1;
+ inpos++; /* skip the '$' */
+ } else {
+ argnum = currarg++;
+ }
+
+ argnum += format_offset;
+
+ /* after argnum comes modifiers */
+ for (;; inpos++) {
+ if (u_isspace(format[inpos]) ||
format[inpos] == 0x30 /* '0' */) {
+ padding = format[inpos];
+ } else if (format[inpos] == 0x2D /* '-'
*/) {
+ alignment = ALIGN_LEFT;
+ /* space padding, the default */
+ } else if (format[inpos] == 0x2B /* '+'
*/) {
+ always_sign = 1;
+ } else if (format[inpos] == 0x27 /*
'\'' */) {
+ padding = format[++inpos];
+ } else {
+ break;
+ }
+ }
+
+ /* after modifiers comes width */
+ if (isdigit((int)format[inpos])) {
+ width = php_u_sprintf_getnumber(format,
&inpos);
+ adjusting |= ADJ_WIDTH;
+ } else {
+ width = 0;
+ }
+
+ /* after width and argnum comes precision */
+ if (format[inpos] == 0x2E /* '.' */) {
+ inpos++;
+ if (format[inpos] >= 0x30 /* '0' */ &&
format[inpos] <= 0x39 /* '9' */) {
+ precision =
php_u_sprintf_getnumber(format, &inpos);
+ adjusting |= ADJ_PRECISION;
+ expprec = 1;
+ } else {
+ precision = 0;
+ }
+ } else {
+ precision = 0;
+ }
+ } else {
+ width = precision = 0;
+ argnum = currarg++ + format_offset;
+ }
+
+ if (argnum >= argc) {
+ efree(result);
+ efree(args);
+ php_error_docref(NULL TSRMLS_CC, E_WARNING,
"Too few arguments");
+ return NULL_ZSTR;
+ }
+
+ if (format[inpos] == 0x6C /* 'l' */) {
+ inpos++;
+ }
+ /* now we expect to find a type specifier */
+ if (multiuse) {
+ MAKE_STD_ZVAL(tmp);
+ *tmp = **(args[argnum]);
+ INIT_PZVAL(tmp);
+ zval_copy_ctor(tmp);
+ } else {
+ SEPARATE_ZVAL(args[argnum]);
+ tmp = *(args[argnum]);
+ }
+
+ switch (format[inpos]) {
+ case 0x73 /* 's' */: {
+ zval *var, var_copy;
+ int use_copy;
+
+ zend_make_unicode_zval(tmp, &var_copy,
&use_copy);
+ if (use_copy) {
+ var = &var_copy;
+ } else {
+ var = tmp;
+ }
+ php_u_sprintf_appendstring(&result,
&outpos, &size,
+
Z_USTRVAL_P(var),
+
width, precision, padding,
+
alignment,
+
Z_USTRLEN_P(var),
+
0, expprec, 0);
+ if (use_copy) {
+ zval_dtor(&var_copy);
+ }
+ break;
+ }
+
+ case 0x64 /* 'd' */:
+ convert_to_long(tmp);
+ php_u_sprintf_appendint(&result,
&outpos, &size,
+
Z_LVAL_P(tmp),
+
width, padding, alignment,
+
always_sign);
+ break;
+
+ case 0x75 /* 'u' */:
+ convert_to_long(tmp);
+ php_u_sprintf_appenduint(&result,
&outpos, &size,
+
Z_LVAL_P(tmp),
+
width, padding, alignment);
+ break;
+
+ case 0x67 /* 'g' */:
+ case 0x47 /* 'G' */:
+ case 0x65 /* 'e' */:
+ case 0x45 /* 'E' */:
+ case 0x66 /* 'f' */:
+ case 0x46 /* 'F' */:
+ convert_to_double(tmp);
+ php_u_sprintf_appenddouble(&result,
&outpos, &size,
+
Z_DVAL_P(tmp),
+
width, padding, alignment,
+
precision, adjusting,
+
format[inpos], always_sign
+
TSRMLS_CC);
+ break;
+
+ case 0x63 /* 'c' */:
+ convert_to_long(tmp);
+ php_u_sprintf_appendchar(&result,
&outpos, &size,
+
(char) Z_LVAL_P(tmp) TSRMLS_CC);
+ break;
+
+ case 0x6F /* 'o' */:
+ convert_to_long(tmp);
+ php_u_sprintf_append2n(&result,
&outpos, &size,
+
Z_LVAL_P(tmp),
+
width, padding, alignment, 3,
+
u_hexchars, expprec);
+ break;
+
+ case 0x78 /* 'x' */:
+ convert_to_long(tmp);
+ php_u_sprintf_append2n(&result,
&outpos, &size,
+
Z_LVAL_P(tmp),
+
width, padding, alignment, 4,
+
u_hexchars, expprec);
+ break;
+
+ case 0x58 /* 'X' */:
+ convert_to_long(tmp);
+ php_u_sprintf_append2n(&result,
&outpos, &size,
+
Z_LVAL_P(tmp),
+
width, padding, alignment, 4,
+
u_HEXCHARS, expprec);
+ break;
+
+ case 0x62 /* 'b' */:
+ convert_to_long(tmp);
+ php_u_sprintf_append2n(&result,
&outpos, &size,
+
Z_LVAL_P(tmp),
+
width, padding, alignment, 1,
+
u_hexchars, expprec);
+ break;
+
+ case 0x25 /* '%' */:
+ php_u_sprintf_appendchar(&result,
&outpos, &size, 0x25 /* '%' */ TSRMLS_CC);
+
+ break;
+ default:
+ break;
+ }
+ if (multiuse) {
+ zval_ptr_dtor(&tmp);
+ }
+ inpos++;
+ }
+ }
+
+ efree(args);
+
+ /* possibly, we have to make sure we have room for the terminating
null? */
+ result[outpos] = 0;
+ *len = outpos;
+ result_str.u = result;
+
+ switch (type) {
+ case PHP_OUTPUT:
+ {
+ UErrorCode status = U_ZERO_ERROR;
+ char *s;
+ int s_len;
+
+
zend_unicode_to_string_ex(ZEND_U_CONVERTER(UG(output_encoding_conv)), &s,
&s_len, result, outpos, &status);
+ if(U_FAILURE(status)) {
+ efree(s);
+ efree(result);
+ return NULL_ZSTR;
+ }
+
+ efree(result_str.v);
+ result_str.s = s;
+ *len = s_len;
+ break;
+ }
+ case PHP_RUNTIME:
+ default:
+ /* nothing to be done */
+ break;
+ }
+
+ return result_str;
+}
+/* }}} */
+
+
/* {{{ proto string sprintf(string format [, mixed arg1 [, mixed ...]])
Return a formatted string */
PHP_FUNCTION(user_sprintf)
{
- char *result;
int len;
-
- if ((result=php_formatted_print(ht, &len, 0, 0 TSRMLS_CC))==NULL) {
- RETURN_FALSE;
+ zstr result;
+
+ if (!UG(unicode)) {
+ if ((result.s = php_formatted_print(ht, &len, 0, 0, PHP_RUNTIME
TSRMLS_CC))==NULL) {
+ RETURN_FALSE;
+ }
+ RETVAL_STRINGL(result.s, len, 0);
+ } else {
+ result = php_u_formatted_print(ht, &len, 0, 0, PHP_RUNTIME
TSRMLS_CC);
+ if (result.v == NULL) {
+ RETURN_FALSE;
+ }
+ RETVAL_UNICODEL(result.u, len, 0);
}
- RETVAL_STRINGL(result, len, 0);
}
/* }}} */
@@ -648,13 +1266,21 @@ PHP_FUNCTION(user_sprintf)
Return a formatted string */
PHP_FUNCTION(vsprintf)
{
- char *result;
int len;
-
- if ((result=php_formatted_print(ht, &len, 1, 0 TSRMLS_CC))==NULL) {
- RETURN_FALSE;
+ zstr result;
+
+ if (!UG(unicode)) {
+ if ((result.s = php_formatted_print(ht, &len, 1, 0, PHP_RUNTIME
TSRMLS_CC))==NULL) {
+ RETURN_FALSE;
+ }
+ RETVAL_STRINGL(result.s, len, 0);
+ } else {
+ result = php_u_formatted_print(ht, &len, 1, 0, PHP_RUNTIME
TSRMLS_CC);
+ if (result.v == NULL) {
+ RETURN_FALSE;
+ }
+ RETVAL_UNICODEL(result.u, len, 0);
}
- RETVAL_STRINGL(result, len, 0);
}
/* }}} */
@@ -662,14 +1288,22 @@ PHP_FUNCTION(vsprintf)
Output a formatted string */
PHP_FUNCTION(user_printf)
{
- char *result;
int len;
-
- if ((result=php_formatted_print(ht, &len, 0, 0 TSRMLS_CC))==NULL) {
- RETURN_FALSE;
+ zstr result;
+
+ if (!UG(unicode)) {
+ if ((result.s = php_formatted_print(ht, &len, 0, 0, PHP_OUTPUT
TSRMLS_CC))==NULL) {
+ RETURN_FALSE;
+ }
+ } else {
+ result = php_u_formatted_print(ht, &len, 0, 0, PHP_OUTPUT
TSRMLS_CC);
+ if (result.v == NULL) {
+ RETURN_FALSE;
+ }
}
- PHPWRITE(result, len);
- efree(result);
+
+ PHPWRITE(result.s, len);
+ efree(result.v);
RETURN_LONG(len);
}
/* }}} */
@@ -678,14 +1312,22 @@ PHP_FUNCTION(user_printf)
Output a formatted string */
PHP_FUNCTION(vprintf)
{
- char *result;
int len;
+ zstr result;
- if ((result=php_formatted_print(ht, &len, 1, 0 TSRMLS_CC))==NULL) {
- RETURN_FALSE;
+ if (!UG(unicode)) {
+ if ((result.s = php_formatted_print(ht, &len, 1, 0, PHP_OUTPUT
TSRMLS_CC))==NULL) {
+ RETURN_FALSE;
+ }
+ } else {
+ result = php_u_formatted_print(ht, &len, 1, 0, PHP_OUTPUT
TSRMLS_CC);
+ if (result.v == NULL) {
+ RETURN_FALSE;
+ }
}
- PHPWRITE(result, len);
- efree(result);
+
+ PHPWRITE(result.s, len);
+ efree(result.v);
RETURN_LONG(len);
}
/* }}} */
@@ -696,8 +1338,8 @@ PHP_FUNCTION(fprintf)
{
php_stream *stream;
zval **arg1;
- char *result;
- int len;
+ zstr result;
+ int len, ret;
if (ZEND_NUM_ARGS() < 2) {
WRONG_PARAM_COUNT;
@@ -709,15 +1351,22 @@ PHP_FUNCTION(fprintf)
php_stream_from_zval(stream, arg1);
- if ((result=php_formatted_print(ht, &len, 0, 1 TSRMLS_CC))==NULL) {
- RETURN_FALSE;
+ if (!UG(unicode)) {
+ if ((result.s = php_formatted_print(ht, &len, 0, 1, PHP_RUNTIME
TSRMLS_CC))==NULL) {
+ RETURN_FALSE;
+ }
+ ret = php_stream_write(stream, result.s, len);
+ } else {
+ result = php_u_formatted_print(ht, &len, 0, 1, PHP_RUNTIME
TSRMLS_CC);
+ if (result.v == NULL) {
+ RETURN_FALSE;
+ }
+ ret = php_stream_write_unicode(stream, result.u, len);
}
+
+ efree(result.v);
- php_stream_write(stream, result, len);
-
- efree(result);
-
- RETURN_LONG(len);
+ RETURN_LONG(ret);
}
/* }}} */
@@ -727,8 +1376,8 @@ PHP_FUNCTION(vfprintf)
{
php_stream *stream;
zval **arg1;
- char *result;
- int len;
+ zstr result;
+ int len, ret;
if (ZEND_NUM_ARGS() != 3) {
WRONG_PARAM_COUNT;
@@ -740,15 +1389,22 @@ PHP_FUNCTION(vfprintf)
php_stream_from_zval(stream, arg1);
- if ((result=php_formatted_print(ht, &len, 1, 1 TSRMLS_CC))==NULL) {
- RETURN_FALSE;
+ if (!UG(unicode)) {
+ if ((result.s = php_formatted_print(ht, &len, 1, 1, PHP_RUNTIME
TSRMLS_CC))==NULL) {
+ RETURN_FALSE;
+ }
+ ret = php_stream_write(stream, result.s, len);
+ } else {
+ result = php_u_formatted_print(ht, &len, 1, 1, PHP_RUNTIME
TSRMLS_CC);
+ if (result.v == NULL) {
+ RETURN_FALSE;
+ }
+ ret = php_stream_write_unicode(stream, result.u, len);
}
- php_stream_write(stream, result, len);
-
- efree(result);
+ efree(result.v);
- RETURN_LONG(len);
+ RETURN_LONG(ret);
}
/* }}} */
--
PHP Internals - PHP Runtime Development Mailing List
To unsubscribe, visit: http://www.php.net/unsub.php