/**
 * Segment a sentence into a finer-grained word list for search use.
 *
 * Each word produced by Jieba::cut() is appended to the result, preceded by
 * those of its 2-character and 3-character substrings that exist as keys in
 * self::$FREQ. 2-character substrings are only considered for words longer
 * than two characters, 3-character substrings for words longer than three.
 * Lengths and substrings are measured in UTF-8 characters, not bytes.
 *
 * @param string $sentence Text handed to Jieba::cut().
 * @param array  $options  Merged over array('mode' => 'default'); the merged
 *                         value is not read by this method.
 *
 * @return array Flat list; per word: known 2-grams, then known 3-grams, then
 *               the word itself.
 */
public static function cutForSearch($sentence, $options = array())
{
    // The merged result is not read anywhere below.
    $options = array_merge(array('mode' => 'default'), $options);

    $result = array();

    foreach (Jieba::cut($sentence) as $word) {
        $length = mb_strlen($word, 'UTF-8');

        // Emit all 2-grams before any 3-gram so the output order stays
        // "2-grams, 3-grams, word".
        foreach (array(2, 3) as $size) {
            // Only words strictly longer than the n-gram size are split.
            if ($length <= $size) {
                continue;
            }

            for ($start = 0; $start + $size <= $length; $start++) {
                $gram = mb_substr($word, $start, $size, 'UTF-8');
                if (isset(self::$FREQ[$gram])) {
                    $result[] = $gram;
                }
            }
        }

        $result[] = $word;
    }

    return $result;
}
*
* PHP version 5
*
* @category PHP
* @package  /src/cmd/
* @author   Fukuball Lin <*****@*****.**>
* @license  MIT Licence
* @version  GIT: <fukuball/jieba-php>
* @link     https://github.com/fukuball/jieba-php
*/

// Command-line demo: loads the segmenter classes, initialises them, then
// dumps the result of several Jieba::cut() / Jieba::cutForSearch() calls.

// Raise the memory limit before the library files are loaded.
ini_set('memory_limit', '600M');

// dirname(__DIR__) is the parent of this script's directory, i.e. the same
// path the original dirname(dirname(__FILE__)) produced.
require_once dirname(__DIR__) . "/vendor/multi-array/MultiArray.php";
require_once dirname(__DIR__) . "/vendor/multi-array/Factory/MultiArrayFactory.php";
require_once dirname(__DIR__) . "/class/Jieba.php";
require_once dirname(__DIR__) . "/class/Finalseg.php";

use Fukuball\Jieba\Jieba;
use Fukuball\Jieba\Finalseg;

// Fixed typo: the dictionary option was spelled 'samll'.
// NOTE(review): presumably Jieba::init() matches on the exact string 'small'
// and silently fell back to another dictionary before — confirm against
// Jieba::init().
Jieba::init(array('mode' => 'test', 'dict' => 'small'));
Finalseg::init();

// Cut with the default arguments.
$seg_list = Jieba::cut("怜香惜玉也得要看对象啊!");
var_dump($seg_list);

// Same sentence cut twice: second argument true ("Full Mode") and false
// ("Default Mode").
echo "Full Mode: \n";
$seg_list = Jieba::cut("我来到北京清华大学", true);
var_dump($seg_list);

echo "Default Mode: \n";
$seg_list = Jieba::cut("我来到北京清华大学", false);
var_dump($seg_list);

$seg_list = Jieba::cut("他来到了网易杭研大厦");
var_dump($seg_list);

// Search-oriented segmentation.
$seg_list = Jieba::cutForSearch("小明硕士毕业于中国科学院计算所,后在日本京都大学深造");
var_dump($seg_list);