Skip to content

Commit

Permalink
Implement #77726: Allow null character in regex patterns
Browse files Browse the repository at this point in the history
In 8b3c1a3, this was disallowed to fix #55856, which was a security
issue caused by the /e modifier. The fix that was made was the
"Easier fix" as described in the original report.

With this fix, pattern strings are no longer treated as null terminated,
so null characters can be placed inside and matched against with regex
patterns without security problems, so there is no longer a reason to
give the error. Allowing this is consistent with the behaviour of many
other languages, including JavaScript, and thanks to PCRE2[0], it does
not require manually escaping null characters. Now that we can avoid the
error here without the cost of escaping characters, there is really no
need anymore to stray here from the conventional behaviour.

Currently, null characters are still disallowed before the first
delimiter and in the options section at the end of a regex string, but
these error messages have been updated.

[0] Since PCRE2, pattern strings no longer have to be null terminated,
and raw null characters match as normal.

Closes GH-8114.
  • Loading branch information
tobil4sk authored and cmb69 committed Jun 17, 2022
1 parent 98a4ab2 commit 5bb3e23
Show file tree
Hide file tree
Showing 14 changed files with 170 additions and 57 deletions.
3 changes: 3 additions & 0 deletions NEWS
Expand Up @@ -24,6 +24,9 @@ GD:
- ODBC:
. Fixed handling of single-key connection strings. (Calvin Buckley)

- PCRE:
. Implemented FR #77726 (Allow null character in regex patterns). (cmb)

- PDO_ODBC:
. Fixed handling of single-key connection strings. (Calvin Buckley)

Expand Down
3 changes: 3 additions & 0 deletions UPGRADING
Expand Up @@ -221,6 +221,9 @@ PHP 8.2 UPGRADE NOTES
- OCI8:
. The minimum Oracle Client library version required is now 11.2.

- PCRE:
. NUL characters (\0) in pattern strings are now supported.

- SQLite3:
. sqlite3.defensive is now PHP_INI_USER.

Expand Down
38 changes: 15 additions & 23 deletions ext/pcre/php_pcre.c
Expand Up @@ -624,7 +624,7 @@ PHPAPI pcre_cache_entry* pcre_get_compiled_regex_cache_ex(zend_string *regex, in
pcre_cache_entry new_entry;
int rc;
zend_string *key;
pcre_cache_entry *ret;
pcre_cache_entry *ret;

if (locale_aware && BG(ctype_string)) {
key = zend_string_concat2(
Expand All @@ -645,28 +645,28 @@ PHPAPI pcre_cache_entry* pcre_get_compiled_regex_cache_ex(zend_string *regex, in
}

p = ZSTR_VAL(regex);
const char* end_p = ZSTR_VAL(regex) + ZSTR_LEN(regex);

/* Parse through the leading whitespace, and display a warning if we
get to the end without encountering a delimiter. */
while (isspace((int)*(unsigned char *)p)) p++;
if (*p == 0) {
if (p >= end_p) {
if (key != regex) {
zend_string_release_ex(key, 0);
}
php_error_docref(NULL, E_WARNING,
p < ZSTR_VAL(regex) + ZSTR_LEN(regex) ? "Null byte in regex" : "Empty regular expression");
php_error_docref(NULL, E_WARNING, "Empty regular expression");
pcre_handle_exec_error(PCRE2_ERROR_INTERNAL);
return NULL;
}

/* Get the delimiter and display a warning if it is alphanumeric
or a backslash. */
delimiter = *p++;
if (isalnum((int)*(unsigned char *)&delimiter) || delimiter == '\\') {
if (isalnum((int)*(unsigned char *)&delimiter) || delimiter == '\\' || delimiter == '\0') {
if (key != regex) {
zend_string_release_ex(key, 0);
}
php_error_docref(NULL,E_WARNING, "Delimiter must not be alphanumeric or backslash");
php_error_docref(NULL, E_WARNING, "Delimiter must not be alphanumeric, backslash, or NUL");
pcre_handle_exec_error(PCRE2_ERROR_INTERNAL);
return NULL;
}
Expand All @@ -682,8 +682,8 @@ PHPAPI pcre_cache_entry* pcre_get_compiled_regex_cache_ex(zend_string *regex, in
/* We need to iterate through the pattern, searching for the ending delimiter,
but skipping the backslashed delimiters. If the ending delimiter is not
found, display a warning. */
while (*pp != 0) {
if (*pp == '\\' && pp[1] != 0) pp++;
while (pp < end_p) {
if (*pp == '\\' && pp + 1 < end_p) pp++;
else if (*pp == delimiter)
break;
pp++;
Expand All @@ -695,8 +695,8 @@ PHPAPI pcre_cache_entry* pcre_get_compiled_regex_cache_ex(zend_string *regex, in
* reach the end of the pattern without matching, display a warning.
*/
int brackets = 1; /* brackets nesting level */
while (*pp != 0) {
if (*pp == '\\' && pp[1] != 0) pp++;
while (pp < end_p) {
if (*pp == '\\' && pp + 1 < end_p) pp++;
else if (*pp == end_delimiter && --brackets <= 0)
break;
else if (*pp == start_delimiter)
Expand All @@ -705,13 +705,11 @@ PHPAPI pcre_cache_entry* pcre_get_compiled_regex_cache_ex(zend_string *regex, in
}
}

if (*pp == 0) {
if (pp >= end_p) {
if (key != regex) {
zend_string_release_ex(key, 0);
}
if (pp < ZSTR_VAL(regex) + ZSTR_LEN(regex)) {
php_error_docref(NULL,E_WARNING, "Null byte in regex");
} else if (start_delimiter == end_delimiter) {
if (start_delimiter == end_delimiter) {
php_error_docref(NULL,E_WARNING, "No ending delimiter '%c' found", delimiter);
} else {
php_error_docref(NULL,E_WARNING, "No ending matching delimiter '%c' found", delimiter);
Expand All @@ -729,7 +727,7 @@ PHPAPI pcre_cache_entry* pcre_get_compiled_regex_cache_ex(zend_string *regex, in

/* Parse through the options, setting appropriate flags. Display
a warning if we encounter an unknown modifier. */
while (pp < ZSTR_VAL(regex) + ZSTR_LEN(regex)) {
while (pp < end_p) {
switch (*pp++) {
/* Perl compatible options */
case 'i': coptions |= PCRE2_CASELESS; break;
Expand Down Expand Up @@ -764,9 +762,9 @@ PHPAPI pcre_cache_entry* pcre_get_compiled_regex_cache_ex(zend_string *regex, in

default:
if (pp[-1]) {
php_error_docref(NULL,E_WARNING, "Unknown modifier '%c'", pp[-1]);
php_error_docref(NULL, E_WARNING, "Unknown modifier '%c'", pp[-1]);
} else {
php_error_docref(NULL,E_WARNING, "Null byte in regex");
php_error_docref(NULL, E_WARNING, "NUL is not a valid modifier");
}
pcre_handle_exec_error(PCRE2_ERROR_INTERNAL);
efree(pattern);
Expand Down Expand Up @@ -2438,12 +2436,6 @@ PHP_FUNCTION(preg_replace_callback_array)
}

ZEND_HASH_FOREACH_STR_KEY_VAL(pattern, str_idx_regex, replace) {
if (!str_idx_regex) {
php_error_docref(NULL, E_WARNING, "Delimiter must not be alphanumeric or backslash");
RETVAL_NULL();
goto error;
}

if (!zend_is_callable_ex(replace, NULL, 0, NULL, &fcc, NULL)) {
zend_argument_type_error(1, "must contain only valid callbacks");
goto error;
Expand Down
2 changes: 1 addition & 1 deletion ext/pcre/tests/bug73392.phpt
Expand Up @@ -21,5 +21,5 @@ var_dump(preg_replace_callback_array(
), 'a'));
?>
--EXPECTF--
Warning: preg_replace_callback_array(): Delimiter must not be alphanumeric or backslash in %sbug73392.php on line %d
Warning: preg_replace_callback_array(): Delimiter must not be alphanumeric, backslash, or NUL in %sbug73392.php on line %d
NULL
6 changes: 5 additions & 1 deletion ext/pcre/tests/delimiters.phpt
Expand Up @@ -12,6 +12,7 @@ var_dump(preg_match('~a', ''));
var_dump(preg_match('@\@\@@', '@@'));
var_dump(preg_match('//z', '@@'));
var_dump(preg_match('{', ''));
var_dump(preg_match("\0\0", ''));

?>
--EXPECTF--
Expand All @@ -22,7 +23,7 @@ Warning: preg_match(): Empty regular expression in %sdelimiters.php on line 4
bool(false)
int(1)

Warning: preg_match(): Delimiter must not be alphanumeric or backslash in %sdelimiters.php on line 6
Warning: preg_match(): Delimiter must not be alphanumeric, backslash, or NUL in %sdelimiters.php on line 6
bool(false)
int(1)

Expand All @@ -35,3 +36,6 @@ bool(false)

Warning: preg_match(): No ending matching delimiter '}' found in %sdelimiters.php on line 11
bool(false)

Warning: preg_match(): Delimiter must not be alphanumeric, backslash, or NUL in %sdelimiters.php on line 12
bool(false)
76 changes: 50 additions & 26 deletions ext/pcre/tests/null_bytes.phpt
Expand Up @@ -3,40 +3,64 @@ Zero byte test
--FILE--
<?php

preg_match("\0//i", "");
preg_match("/\0/i", "");
preg_match("//\0i", "");
preg_match("//i\0", "");
preg_match("/\\\0/i", "");

preg_match("\0[]i", "");
preg_match("[\0]i", "");
preg_match("[]\0i", "");
preg_match("[]i\0", "");
preg_match("[\\\0]i", "");
var_dump(preg_match("\0//i", ""));
var_dump(preg_match("/\0/i", ""));
var_dump(preg_match("/\0/i", "\0"));
var_dump(preg_match("//\0i", ""));
var_dump(preg_match("//i\0", ""));
var_dump(preg_match("/\\\0/i", ""));
var_dump(preg_match("/\\\0/i", "\\\0"));

preg_replace("/foo/e\0/i", "echo('Eek');", "");

?>
--EXPECTF--
Warning: preg_match(): Null byte in regex in %snull_bytes.php on line 3
var_dump(preg_match("\0[]i", ""));
var_dump(preg_match("[\0]i", ""));
var_dump(preg_match("[\0]i", "\0"));
var_dump(preg_match("[]\0i", ""));
var_dump(preg_match("[]i\0", ""));
var_dump(preg_match("[\\\0]i", ""));
var_dump(preg_match("[\\\0]i", "\\\0"));

Warning: preg_match(): Null byte in regex in %snull_bytes.php on line 4
var_dump(preg_match("/abc\0def/", "abc"));
var_dump(preg_match("/abc\0def/", "abc\0def"));
var_dump(preg_match("/abc\0def/", "abc\0fed"));

Warning: preg_match(): Null byte in regex in %snull_bytes.php on line 5
var_dump(preg_match("[abc\0def]", "abc"));
var_dump(preg_match("[abc\0def]", "abc\0def"));
var_dump(preg_match("[abc\0def]", "abc\0fed"));

Warning: preg_match(): Null byte in regex in %snull_bytes.php on line 6
preg_replace("/foo/e\0/i", "echo('Eek');", "");

Warning: preg_match(): Null byte in regex in %snull_bytes.php on line 7
?>
--EXPECTF--
Warning: preg_match(): Delimiter must not be alphanumeric, backslash, or NUL in %snull_bytes.php on line 3
bool(false)
int(0)
int(1)

Warning: preg_match(): Null byte in regex in %snull_bytes.php on line 9
Warning: preg_match(): NUL is not a valid modifier in %snull_bytes.php on line 6
bool(false)

Warning: preg_match(): Null byte in regex in %snull_bytes.php on line 10
Warning: preg_match(): NUL is not a valid modifier in %snull_bytes.php on line 7
bool(false)
int(0)
int(1)

Warning: preg_match(): Null byte in regex in %snull_bytes.php on line 11
Warning: preg_match(): Delimiter must not be alphanumeric, backslash, or NUL in %snull_bytes.php on line 11
bool(false)
int(0)
int(1)

Warning: preg_match(): Null byte in regex in %snull_bytes.php on line 12
Warning: preg_match(): NUL is not a valid modifier in %snull_bytes.php on line 14
bool(false)

Warning: preg_match(): Null byte in regex in %snull_bytes.php on line 13
Warning: preg_match(): NUL is not a valid modifier in %snull_bytes.php on line 15
bool(false)
int(0)
int(1)
int(0)
int(1)
int(0)
int(0)
int(1)
int(0)

Warning: preg_replace(): Null byte in regex in %snull_bytes.php on line 15
Warning: preg_replace(): NUL is not a valid modifier in %snull_bytes.php on line 27
2 changes: 1 addition & 1 deletion ext/pcre/tests/preg_grep_error1.phpt
Expand Up @@ -37,7 +37,7 @@ echo "Done"

Arg value is abcdef

Warning: preg_grep(): Delimiter must not be alphanumeric or backslash in %spreg_grep_error1.php on line %d
Warning: preg_grep(): Delimiter must not be alphanumeric, backslash, or NUL in %spreg_grep_error1.php on line %d
bool(false)

Arg value is /[a-zA-Z]
Expand Down
2 changes: 1 addition & 1 deletion ext/pcre/tests/preg_match_all_error1.phpt
Expand Up @@ -38,7 +38,7 @@ var_dump($matches);

Arg value is abcdef

Warning: preg_match_all(): Delimiter must not be alphanumeric or backslash in %spreg_match_all_error1.php on line %d
Warning: preg_match_all(): Delimiter must not be alphanumeric, backslash, or NUL in %spreg_match_all_error1.php on line %d
bool(false)
NULL

Expand Down
2 changes: 1 addition & 1 deletion ext/pcre/tests/preg_match_error1.phpt
Expand Up @@ -34,7 +34,7 @@ try {

Arg value is abcdef

Warning: preg_match(): Delimiter must not be alphanumeric or backslash in %spreg_match_error1.php on line %d
Warning: preg_match(): Delimiter must not be alphanumeric, backslash, or NUL in %spreg_match_error1.php on line %d
bool(false)

Arg value is /[a-zA-Z]
Expand Down
66 changes: 66 additions & 0 deletions ext/pcre/tests/preg_replace_callback_array_error.phpt
@@ -0,0 +1,66 @@
--TEST--
preg_replace_callback_array() errors
--FILE--
<?php

function b() {
return "b";
}

// empty strings

var_dump(preg_replace_callback_array(
array(
"/a/" => 'b',
"" => function () { return "ok"; }), 'a'));

var_dump(preg_replace_callback_array(
array(
"/a/" => 'b',
null => function () { return "ok"; }), 'a'));

// backslashes

var_dump(preg_replace_callback_array(
array(
"/a/" => 'b',
"\\b\\" => function () { return "ok"; }), 'a'));

// alphanumeric delimiters

var_dump(preg_replace_callback_array(
array(
"/a/" => 'b',
"aba" => function () { return "ok"; }), 'a'));

var_dump(preg_replace_callback_array(
array(
"/a/" => 'b',
"1b1" => function () { return "ok"; }), 'a'));

// null character delimiter

var_dump(preg_replace_callback_array(
array(
"/a/" => 'b',
"\0b\0" => function () { return "ok"; }), 'a'));

?>
--EXPECTF--
Warning: preg_replace_callback_array(): Empty regular expression in %spreg_replace_callback_array_error.php on line 12
NULL

Warning: preg_replace_callback_array(): Empty regular expression in %spreg_replace_callback_array_error.php on line 17
NULL

Warning: preg_replace_callback_array(): Delimiter must not be alphanumeric, backslash, or NUL in %spreg_replace_callback_array_error.php on line 24
NULL

Warning: preg_replace_callback_array(): Delimiter must not be alphanumeric, backslash, or NUL in %spreg_replace_callback_array_error.php on line 31
NULL

Warning: preg_replace_callback_array(): Delimiter must not be alphanumeric, backslash, or NUL in %spreg_replace_callback_array_error.php on line 36
NULL

Warning: preg_replace_callback_array(): Delimiter must not be alphanumeric, backslash, or NUL in %spreg_replace_callback_array_error.php on line 43
NULL
21 changes: 21 additions & 0 deletions ext/pcre/tests/preg_replace_callback_array_fatal_error.phpt
@@ -0,0 +1,21 @@
--TEST--
preg_replace_callback_array() invalid callable
--FILE--
<?php

function b() {
return "b";
}

// invalid callable
var_dump(preg_replace_callback_array(
array(
"/a/" => 'b',
"/b/" => 'invalid callable'), 'a'));

--EXPECTF--
Fatal error: Uncaught TypeError: preg_replace_callback_array(): Argument #1 ($pattern) must contain only valid callbacks in %spreg_replace_callback_array_fatal_error.php:11
Stack trace:
#0 %spreg_replace_callback_array_fatal_error.php(11): preg_replace_callback_array(Array, 'a')
#1 {main}
thrown in %spreg_replace_callback_array_fatal_error.php on line 11
2 changes: 1 addition & 1 deletion ext/pcre/tests/preg_replace_callback_error1.phpt
Expand Up @@ -30,7 +30,7 @@ foreach($regex_array as $regex_value) {

Arg value is abcdef

Warning: preg_replace_callback(): Delimiter must not be alphanumeric or backslash in %s on line %d
Warning: preg_replace_callback(): Delimiter must not be alphanumeric, backslash, or NUL in %s on line %d
NULL

Arg value is /[a-zA-Z]
Expand Down
2 changes: 1 addition & 1 deletion ext/pcre/tests/preg_replace_error1.phpt
Expand Up @@ -33,7 +33,7 @@ try {

Arg value is abcdef

Warning: preg_replace(): Delimiter must not be alphanumeric or backslash in %spreg_replace_error1.php on line %d
Warning: preg_replace(): Delimiter must not be alphanumeric, backslash, or NUL in %spreg_replace_error1.php on line %d
NULL

Arg value is /[a-zA-Z]
Expand Down

0 comments on commit 5bb3e23

Please sign in to comment.