zdc253212956 发表于 2017-3-30 12:03:28

PHP 统计可读字数

// Sample input: each record carries an HTML fragment in 'body' that contains
// a data-role="title" heading and a data-role="content" section.
$recordset = array(array('body'=>'<h1 data-role="title">中国人</h1><div data-role="author"></div><div data-role="content">李34团%$长教#@$导我,们.说,<青>年学子应该《参军》。李?!~老【团长--还教】导,我aa们说,接b受t军“队”的管理?和...再!教育。\n</div><div data-role="source"></div>'));

// For every record with a non-empty body:
//   - 'article_title' receives the text of the title heading ('' if absent),
//   - 'word_count' receives the number of "readable" characters in the
//     content section (CJK ideographs U+4E00..U+9FA5, ASCII letters, digits
//     and underscore; punctuation and symbols are ignored),
//   - the raw 'body' is removed.
// Records whose body is missing or empty are left untouched.
foreach ($recordset as $k => $v) {
    if (!isset($v['body']) || !is_string($v['body']) || $v['body'] === '') {
        continue;
    }

    $title = $content = array();

    // Keep only the captured title text (group 1), not the whole match array.
    preg_match('/<h1 data-role="title">(.*)<\/h1>/U', $v['body'], $title);
    $recordset[$k]['article_title'] = isset($title[1]) ? $title[1] : '';

    // Ungreedy match up to the first closing </div>; a <div> nested inside
    // the content section would therefore truncate the captured text.
    preg_match('/<div data-role="content">(.*)<\/div>/sU', $v['body'], $content);
    $text = isset($content[1]) ? $content[1] : '';

    // Strip real HTML tags (tag names start with an ASCII letter, so text such
    // as "<青>" is kept) and literal backslash-r / backslash-n sequences. The
    // pattern is an alternation, not a character class, so ordinary letters
    // "r" and "n" in the text are no longer deleted.
    $text = (string) preg_replace('/<\/?[a-zA-Z][^>]*>|\\\\[rn]/', '', $text);

    // Count readable characters in a single UTF-8 aware pass: one match per
    // character, so the number of matches is the character count.
    $count = preg_match_all('/[\x{4E00}-\x{9FA5}A-Za-z0-9_]/u', $text, $match);

    // preg_match_all() returns false on failure (e.g. malformed UTF-8).
    $recordset[$k]['word_count'] = ($count === false) ? 0 : $count;
    unset($recordset[$k]['body']);
}

print_r($recordset);
页: [1]
查看完整版本: php 统计可读字数