// Demo: split a numbered bilingual line of the form "<no>. <English> <Chinese>"
// into its English and Chinese parts.
//
// Result ($one):
//   'str' - the input after punctuation normalisation
//   'en'  - the ASCII run before the Chinese text, starting at its first Latin
//           letter (this drops a leading item number such as "67. ")
//   'zh'  - everything from the first non-ASCII character on, with ASCII spaces
//           removed
$string = "67. No one knows . 没有人知道。";

// Normalise CJK / typographic punctuation to ASCII. The split below happens at
// the first non-ASCII character, so a curly quote left inside the English
// sentence would otherwise be taken for the start of the Chinese text.
// NOTE(review): the original contained no-op replacements of "." by "." and of
// "," by ","; they were presumably meant for the full-width forms used here -
// confirm against the original author's intent.
$s = str_replace(
    ['。', '．', '，', '’', '“', '”'],
    ['.', '.', ',', "'", '"', '"'],
    $string
);

// Split at the first non-ASCII byte: group 1 is the longest ASCII-only prefix,
// group 2 is the remainder. The pattern works on bytes (no /u), which is safe
// because every byte of a multi-byte UTF-8 character is >= 0x80.
// The escapes need real backslashes: '/[^x00-x80]/' is a class over the literal
// characters 'x', '0', '8' and the range '0'-'x', so it also matched '.', ' ',
// 'y' and 'z' and ended the English part far too early.
preg_match('/^([\x00-\x7F]*)(.*)\z/s', $s, $parts);
$asciiPrefix = $parts[1];
$chineseTail = $parts[2];

$one = [];
$one['str'] = $s;

// Drop everything before the first Latin letter. The look-ahead keeps the
// prefix untouched when it contains no letter at all, which matches the
// original behaviour of starting the English part at offset 0 in that case.
$one['en'] = preg_replace('/^[^a-zA-Z]+(?=[a-zA-Z])/', '', $asciiPrefix);

// Only ASCII spaces are stripped from the Chinese part.
$one['zh'] = str_replace(' ', '', $chineseTail);

var_dump($one);
结果
array(3) { ["str"]=> string(35) "67. No one knows . 没有人知道." ["en"]=> string(15) "No one knows . " ["zh"]=> string(16) "没有人知道." }