From: Moriyoshi Koizumi Date: Wed, 10 Dec 2003 07:15:28 +0000 (+0000) Subject: Fix bug #26574 (basename() doesn't work properly with multibyte characters) X-Git-Tag: php-5.0.0b3RC1~153 X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=b2cd08f33dcc1c0b5d318370625a01fa0323cded;p=php Fix bug #26574 (basename() doesn't work properly with multibyte characters) --- diff --git a/ext/standard/ftp_fopen_wrapper.c b/ext/standard/ftp_fopen_wrapper.c index 6d4014fdd9..52a4e4e289 100644 --- a/ext/standard/ftp_fopen_wrapper.c +++ b/ext/standard/ftp_fopen_wrapper.c @@ -562,7 +562,7 @@ static size_t php_ftp_dirstream_read(php_stream *stream, char *buf, size_t count php_stream *innerstream = (php_stream *)stream->abstract; size_t tmp_len; char *basename; - int basename_len; + size_t basename_len; if (count != sizeof(php_stream_dirent)) { return 0; @@ -586,8 +586,9 @@ static size_t php_ftp_dirstream_read(php_stream *stream, char *buf, size_t count return 0; } - memcpy(ent->d_name, basename, MIN((int)sizeof(ent->d_name), basename_len)-1); - ent->d_name[sizeof(ent->d_name)-1] = '\0'; + tmp_len = MIN(sizeof(ent->d_name), basename_len) - 1; + memcpy(ent->d_name, basename, tmp_len); + ent->d_name[tmp_len] = '\0'; efree(basename); return sizeof(php_stream_dirent); diff --git a/ext/standard/php_string.h b/ext/standard/php_string.h index a7882dba96..fea95e53cb 100644 --- a/ext/standard/php_string.h +++ b/ext/standard/php_string.h @@ -122,7 +122,7 @@ PHPAPI char *php_addslashes(char *str, int length, int *new_length, int freeit T PHPAPI char *php_addcslashes(char *str, int length, int *new_length, int freeit, char *what, int wlength TSRMLS_DC); PHPAPI void php_stripslashes(char *str, int *len TSRMLS_DC); PHPAPI void php_stripcslashes(char *str, int *len); -PHPAPI void php_basename(char *str, size_t len , char *suffix, size_t sufflen, char **p_ret, int *p_len); +PHPAPI void php_basename(char *str, size_t len , char *suffix, size_t sufflen, char **p_ret, size_t *p_len); PHPAPI size_t php_dirname(char *str, size_t len); PHPAPI char *php_stristr(unsigned char *s, unsigned char *t, size_t s_len, size_t t_len); PHPAPI char *php_str_to_str_ex(char *haystack, int length, char *needle, diff --git a/ext/standard/string.c b/ext/standard/string.c index 23e505ba23..347bf07697 100644 --- a/ext/standard/string.c +++ b/ext/standard/string.c @@ -1068,56 +1068,69 @@ PHP_FUNCTION(strtolower) /* {{{ php_basename */ -PHPAPI void php_basename(char *s, size_t len, char *suffix, size_t sufflen, char **p_ret, int *p_len) +PHPAPI void php_basename(char *s, size_t len, char *suffix, size_t sufflen, char **p_ret, size_t *p_len) { - char *ret=NULL, *c; - c = s + len - 1; - - /* strip trailing slashes */ - while (*c == '/' + char *ret = NULL, *c, *comp, *cend; + size_t inc_len, cnt; + int state; + + c = comp = cend = s; + cnt = len; + state = 0; + while (cnt > 0) { + inc_len = (*c == '\0' ? 1: php_mblen(c, cnt)); + + switch (inc_len) { + case -2: + case -1: + inc_len = 1; + php_mblen(NULL, 0); + break; + case 0: + goto quit_loop; + case 1: #ifdef PHP_WIN32 - || (*c == '\\' && !IsDBCSLeadByte(*(c-1))) + if (*c == '/' || *c == '\\') { +#else + if (*c == '/') { #endif - ) { - c--; - len--; + if (state == 1) { + state = 0; + cend = c; + } + } else { + if (state == 0) { + comp = c; + state = 1; + } + } + default: + break; + } + c += inc_len; + cnt -= inc_len; } - /* do suffix removal as the unix command does */ - if (suffix && (len > sufflen)) { - if (!memcmp(suffix, c-sufflen+1, sufflen)) { - if( (*(c-sufflen) != '/') -#ifdef PHP_WIN32 - && ( *(c-sufflen) != '\\' || IsDBCSLeadByte(*(c-sufflen-1))) -#endif - ) { - c -= sufflen; - len -= sufflen; - } - } +quit_loop: + if (state == 1) { + cend = c; } - - while(c>=s) { - if(*c == '/' -#ifdef PHP_WIN32 - || ( *c == '\\' && !IsDBCSLeadByte(*(c-1))) -#endif - ) { - c++; - break; - } - c--; + if (suffix != NULL && sufflen < (cend - comp) && + memcmp(cend - sufflen, suffix, sufflen) == 0) { + cend -= sufflen; } - if (c