php-src/ext/mbstring/tests/mb_ereg_variation4.phpt

151 lines
3.0 KiB
PHP
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

--TEST--
Test mb_ereg() function : usage variations - pass different character classes as pattern for multibyte string
--SKIPIF--
<?php
// Skip (rather than fail) when the mbstring extension is not loaded.
if (!extension_loaded('mbstring')) {
    die('skip');
}

// mbstring can be loaded while mb_ereg() itself is missing; skip in that case too.
if (!function_exists('mb_ereg')) {
    die("skip mb_ereg() is not available in this build");
}
?>
--FILE--
<?php
/* Prototype : int mb_ereg(string $pattern, string $string [, array $registers])
 * Description: Regular expression match for multibyte string
 * Source code: ext/mbstring/php_mbregex.c
 */

/*
 * Match each POSIX bracket character class against one multibyte subject and
 * dump both the mb_ereg() return value and any captured registers.
 */

echo "*** Testing mb_ereg() : usage variations ***\n";

mb_regex_encoding('utf-8');

// Subject holds Japanese characters, ASCII digits and a second, multibyte
// UTF-8 set of digits. It is kept base64 encoded in the source.
$string_mb = base64_decode('5pel5pys6Kqe44OG44Kt44K544OI44Gn44GZMDEyMzTvvJXvvJbvvJfvvJjvvJnjgII=');

// Keys are the 1-based iteration numbers printed in the section headers.
$character_classes = [
    1  => b'[[:alnum:]]+',
    2  => b'[[:alpha:]]+',
    3  => b'[[:ascii:]]+',
    4  => b'[[:blank:]]+',
    5  => b'[[:cntrl:]]+',
    6  => b'[[:digit:]]+',
    7  => b'[[:graph:]]+',
    8  => b'[[:lower:]]+',
    9  => b'[[:print:]]+',
    10 => b'[[:punct:]]+',
    11 => b'[[:space:]]+',
    12 => b'[[:upper:]]+',
    13 => b'[[:xdigit:]]+',
];

foreach ($character_classes as $iterator => $pattern) {
    // Drop registers left over from the previous pattern before matching again.
    $regs = null;

    echo "\n-- Iteration $iterator --\n";
    var_dump(mb_ereg($pattern, $string_mb, $regs));

    // Registers are only dumped when the match captured something.
    if ($regs) {
        base64_encode_var_dump($regs);
    }
}
/**
 * Replicate a var_dump() of an array, but print string values base64 encoded.
 *
 * Prints "NULL" instead when $regs is empty or otherwise falsy. Non-string
 * values (e.g. bool(false) for an unmatched group) are dumped unchanged.
 *
 * @param array $regs registers filled in by mb_ereg()
 */
function base64_encode_var_dump($regs) {
    if (!$regs) {
        echo "NULL\n";
        return;
    }

    echo "array(" . count($regs) . ") {\n";
    foreach ($regs as $key => $value) {
        echo " [$key]=>\n ";
        // is_unicode() only existed in the abandoned PHP 6 branch and is an
        // undefined function everywhere else; is_string() is the portable check.
        var_dump(is_string($value) ? base64_encode($value) : $value);
    }
    echo "}\n";
}
// Completion marker: the expected output ends with this line.
echo "Done";
?>
--EXPECTF--
*** Testing mb_ereg() : usage variations ***
-- Iteration 1 --
int(47)
array(1) {
[0]=>
string(47) "日本語テキストです01234５６７８９"
}
-- Iteration 2 --
int(27)
array(1) {
[0]=>
string(27) "日本語テキストです"
}
-- Iteration 3 --
int(5)
array(1) {
[0]=>
string(5) "01234"
}
-- Iteration 4 --
bool(false)
-- Iteration 5 --
bool(false)
-- Iteration 6 --
int(20)
array(1) {
[0]=>
string(20) "01234５６７８９"
}
-- Iteration 7 --
int(50)
array(1) {
[0]=>
string(50) "日本語テキストです01234５６７８９。"
}
-- Iteration 8 --
bool(false)
-- Iteration 9 --
int(50)
array(1) {
[0]=>
string(50) "日本語テキストです01234５６７８９。"
}
-- Iteration 10 --
int(3)
array(1) {
[0]=>
string(3) "。"
}
-- Iteration 11 --
bool(false)
-- Iteration 12 --
bool(false)
-- Iteration 13 --
int(5)
array(1) {
[0]=>
string(5) "01234"
}
Done