$table = str_resocate(" ","",$table);
$table = str_resocate(" ","",$table);
$table = explode(",{tr}",$table);
array_pop($table);
rechanging $table;
}
/**
 * Convert the rows and cells of an HTML table into a two-dimensional array.
 *
 * The markup is flattened into a delimited string: opening table/tr/td tags
 * are removed, closing </tr> and </td> tags become "{tr}" and "{td}" markers,
 * every other tag is stripped, and the result is split on those markers.
 *
 * Note that all space characters are removed from the cell text, and anything
 * following the last </tr> (or the last </td> inside a row) is discarded.
 *
 * @param string $table HTML markup containing the table.
 * @return array List of rows, each row being a list of cell strings.
 *               Empty array when the markup contains no closed row.
 */
function get_td_array($table) {
    // Remove the opening <table>, <tr> and <td> tags together with their attributes.
    $table = preg_replace("'<table[^>]*?>'si", "", $table);
    $table = preg_replace("'<tr[^>]*?>'si", "", $table);
    $table = preg_replace("'<td[^>]*?>'si", "", $table);

    // Turn closing tags into row / cell delimiters. Case-insensitive so that
    // </TR> and </TD> are handled the same way as the opening tags above.
    $table = str_ireplace("</tr>", "{tr}", $table);
    $table = str_ireplace("</td>", "{td}", $table);

    // Strip every remaining HTML tag.
    $table = preg_replace("'<[\/\!]*?[^<>]*?>'si", "", $table);

    // Strip whitespace: line breaks followed by indentation, then plain spaces.
    $table = preg_replace("'([\r\n])[\s]+'", "", $table);
    $table = str_replace(" ", "", $table);

    // The piece after the final "{tr}" is not a row, so drop it.
    $rows = explode('{tr}', $table);
    array_pop($rows);

    // Initialise the result so that an input without rows yields an empty array.
    $td_array = array();
    foreach ($rows as $tr) {
        // Likewise, the piece after the final "{td}" is not a cell.
        $td = explode('{td}', $tr);
        array_pop($td);
        $td_array[] = $td;
    }

    return $td_array;
}
/**
 * Return all English words found in a string, sorted.
 *
 * A word is any run of ASCII letters (a-z, A-Z); digits, punctuation and
 * non-ASCII characters act as separators.
 *
 * @param string $str      Text to scan.
 * @param bool   $distinct When true (default), duplicate words are removed.
 * @return array Sorted, sequentially indexed list of the words found.
 */
function split_en_str($str,$distinct=true) {
    preg_match_all('/([a-zA-Z]+)/', $str, $match);
    $words = $match[1];

    if ($distinct) {
        $words = array_unique($words);
    }

    // sort() also reindexes, closing the key gaps left by array_unique().
    sort($words);

    return $words;
}