// Remove duplicate words from a string and build the index string; the string argument must already be word-segmented.
//--------------------------------------------------
/**
 * Build an index string from an already word-segmented, space-separated string.
 *
 * Duplicate words are collapsed and the surviving words are ordered by how
 * often they occurred (most frequent first), joined by single spaces.
 *
 * A word is dropped when it:
 *   - is shorter than 2 bytes after trimming,
 *   - consists only of digits, ':' and '-' (plain numbers, times, dates),
 *   - is exactly 2 bytes long and its first byte is above 0x80.
 *
 * Lengths are measured in bytes on purpose: the 2-byte / high-bit check only
 * works on raw bytes, so strlen()/ord() must not be swapped for mb_* calls.
 * NOTE(review): the 2-byte rule looks aimed at a single double-byte (e.g. GBK)
 * character - confirm the encoding used by callers.
 *
 * @param string $okstr Space-separated words.
 * @param int    $ilen  Byte budget for the result; -1 (default) means no limit.
 *                      A word is appended only while the accumulated length,
 *                      counting the separator after the word, stays below $ilen.
 * @return string The index string, without leading or trailing whitespace.
 */
function getindextext($okstr,$ilen=-1)
{
    $okstr = (string) $okstr;
    if ($okstr === '') {
        return '';
    }

    // word => number of occurrences. Must be an array from the start: indexing
    // an empty string with a word key no longer auto-converts it to an array.
    $counts = array();
    foreach (explode(' ', $okstr) as $word) {
        $word = trim($word);

        // Skip words shorter than 2 bytes.
        if (strlen($word) < 2) {
            continue;
        }
        // Skip numbers, times and dates (only digits, ':' and '-').
        // preg_match replaces ereg(), which was removed in PHP 7.0.
        if (!preg_match('/[^0-9:-]/', $word)) {
            continue;
        }
        // Skip a 2-byte word whose first byte has the high bit set.
        if (strlen($word) === 2 && ord($word[0]) > 0x80) {
            continue;
        }

        if (isset($counts[$word])) {
            $counts[$word]++;
        } else {
            $counts[$word] = 1;
        }
    }

    // Most frequent words first.
    arsort($counts);

    $result = '';
    foreach ($counts as $word => $count) {
        $word = (string) $word;
        // Stop at the first word that would reach the byte budget.
        if ($ilen != -1 && (strlen($result) + strlen($word) + 1) >= $ilen) {
            break;
        }
        $result .= $word . ' ';
    }

    return trim($result);
}
?>
http://www.bkjia.com/phpjc/444908.htmlwww.bkjia.comtruehttp://www.bkjia.com/phpjc/444908.htmltecharticle/除去字串中的重复词,生成索引字符串,字符串参数为已经分词处理的串 //-------------------------------------------------- function getindextext($okstr,...