@@ -34,6 +34,8 @@ var_dump(mb_levenshtein('111', '121', 2, 3, 2));
34
34
echo '--- Very expensive replacement --- ' . \PHP_EOL ;
35
35
var_dump (mb_levenshtein ('111 ' , '121 ' , 2 , 9 , 2 ));
36
36
37
+ echo '--- 128 codepoints --- ' . \PHP_EOL ;
38
+ var_dump (mb_levenshtein (str_repeat ("a " , 128 ), str_repeat ("a " , 125 ) . "abc " ));
37
39
echo '--- 128 codepoints over --- ' . \PHP_EOL ;
38
40
var_dump (mb_levenshtein (str_repeat ("a " , 128 ) . "abc " , str_repeat ("a " , 128 ) . "aaa " ));
39
41
echo '--- 128 codepoints over only $string1 --- ' . \PHP_EOL ;
@@ -48,6 +50,10 @@ $hiragana_a = mb_convert_encoding("あ", "SJIS", "UTF-8");
48
50
$ hiragana_aiu = mb_convert_encoding ("あいう " , "SJIS " , "UTF-8 " );
49
51
var_dump (mb_levenshtein (str_repeat ($ hiragana_a , 128 + 3 ), str_repeat ($ hiragana_a , 128 ) . $ hiragana_aiu , encoding: "SJIS " ));
50
52
53
+ echo '--- café in ISO-8859-1 --- ' . \PHP_EOL ;
54
+ $ cafe = mb_convert_encoding ("café " , "ISO-8859-1 " , "UTF-8 " );
55
+ var_dump (mb_levenshtein ("cafe " , $ cafe , encoding: "ISO-8859-1 " ));
56
+
51
57
echo '--- Usecase of userland code --- ' . \PHP_EOL ;
52
58
/* from: https://qiita.com/mpyw/items/2b636827730e06c71e3d */
53
59
$ query = 'ほあようごぁいまーしゅ ' ;
@@ -113,6 +119,8 @@ int(10)
113
119
int(3)
114
120
--- Very expensive replacement ---
115
121
int(4)
122
+ --- 128 codepoints ---
123
+ int(2)
116
124
--- 128 codepoints over ---
117
125
int(2)
118
126
--- 128 codepoints over only $string1 ---
@@ -123,6 +131,8 @@ int(130)
123
131
int(2)
124
132
--- 128 codepoints over Hiragana in Shift_JIS ---
125
133
int(2)
134
+ --- café in ISO-8859-1 ---
135
+ int(1)
126
136
--- Usecase of userland code ---
127
137
string(30) "おはようございまーす"
128
138
int(4)
0 commit comments