]> granicus.if.org Git - php/commitdiff
- Fix bug #53273 (mb_strcut() returns garbage with the excessive length parameter).
authorMoriyoshi Koizumi <moriyoshi@php.net>
Tue, 9 Nov 2010 03:23:04 +0000 (03:23 +0000)
committerMoriyoshi Koizumi <moriyoshi@php.net>
Tue, 9 Nov 2010 03:23:04 +0000 (03:23 +0000)
ext/mbstring/libmbfl/mbfl/mbfilter.c
ext/mbstring/tests/mb_strcut_missing_boundary_check.phpt [new file with mode: 0644]

index d11cebe447c3acd1bb3779ba9294268a933c56d0..b8b1db26838101a123bed41a7a0016d69b379773 100644 (file)
@@ -1397,6 +1397,10 @@ mbfl_strcut(
                        start = string->val + from;
                        end   = start + (length & -4);
                } else if ((encoding->flag & MBFL_ENCTYPE_SBCS)) {
+                       if (from + length >= string->len) {
+                               length = string->len - from;
+                       }
+
                        start = string->val + from;
                        end = start + length;
                } else if (encoding->mblen_table != NULL) {
diff --git a/ext/mbstring/tests/mb_strcut_missing_boundary_check.phpt b/ext/mbstring/tests/mb_strcut_missing_boundary_check.phpt
new file mode 100644 (file)
index 0000000..a67b99e
--- /dev/null
@@ -0,0 +1,31 @@
+--TEST--
+mb_strcut() missing boundary check.
+--SKIPIF--
+<?php
+extension_loaded('mbstring') or die('skip');
+function_exists('mb_convert_encoding') or die("skip mb_convert_encoding() is not available in this build");
+?>
+--FILE--
+<?php
+mb_internal_encoding("UCS-4LE");
+var_dump(bin2hex(mb_strcut("\x61\x00\x00\x00\x62\x00\x00\x00\x63\x00\x00\x00", 0, 32)));
+mb_internal_encoding("UCS-4BE");
+var_dump(bin2hex(mb_strcut("\x00\x00\x00\x61\x00\x00\x00\x62\x00\x00\x00\x63", 0, 32)));
+mb_internal_encoding("UCS-2LE");
+var_dump(bin2hex(mb_strcut("\x61\x00\x62\x00\x63\x00", 0, 32)));
+mb_internal_encoding("UCS-2BE");
+var_dump(bin2hex(mb_strcut("\x00\x61\x00\x62\x00\x63", 0, 32)));
+mb_internal_encoding("UTF-16");
+var_dump(bin2hex(mb_strcut("\x00\x61\x00\x62\x00\x63", 0, 32)));
+mb_internal_encoding("UTF-8");
+var_dump(bin2hex(mb_strcut("abc", 0, 32)));
+mb_internal_encoding("ISO-8859-1");
+var_dump(bin2hex(mb_strcut("abc", 0, 32)));
+--EXPECT--
+string(24) "610000006200000063000000"
+string(24) "000000610000006200000063"
+string(12) "610062006300"
+string(12) "006100620063"
+string(12) "006100620063"
+string(6) "616263"
+string(6) "616263"