|
|
@@ -56,12 +56,11 @@ class CaseMan
|
|
|
if ($wordEnd === $ending[0]) {
|
|
|
//匹配成功
|
|
|
$word = mb_substr($base, 0, mb_strlen($base, "UTF-8") - $endingLen, "UTF-8") . $ending[1];
|
|
|
-
|
|
|
//尝试sandhi
|
|
|
//TODO 加两个sandhi
|
|
|
$hasSandhi = false;
|
|
|
foreach ($case->union as $sandhi) {
|
|
|
- $sandhiLen = strlen($sandhi[0]);
|
|
|
+ $sandhiLen = mb_strlen($sandhi[0],'UTF-8');
|
|
|
$sandhiEnd = mb_substr($word, 0 - $sandhiLen, null, "UTF-8");
|
|
|
if ($sandhiEnd === $sandhi[0]) {
|
|
|
$sandhiWord = mb_substr($word, 0, mb_strlen($word, "UTF-8") - $sandhiLen, "UTF-8") . $sandhi[1];
|