//将HTML表格的每行每列转为数组,采集表格数据
<?
/**
 * Convert the rows and cells of an HTML table into a two-dimensional array.
 *
 * Opening <table>/<tr>/<td> tags are discarded, every closing </td> and </tr>
 * is turned into a placeholder, all remaining markup is stripped, and the
 * leftover text is split on the placeholders. Spaces, &nbsp; entities and
 * line breaks (with the whitespace that follows them) are removed from the
 * cell text, so "Hello World" is returned as "HelloWorld".
 *
 * Only cells closed with </td> are recognised; text after the last </td> of a
 * row, or after the last </tr> of the table, is dropped.
 *
 * @param string $table HTML markup containing the table.
 * @return array List of rows, each row being a list of cell strings. An empty
 *               array is returned when the input contains no closed row.
 */
function get_td_array($table) {
        // Opening tags carry no structure we need; the closing tags delimit cells and rows.
        $table = preg_replace("'<table[^>]*?>'si", "", $table);
        $table = preg_replace("'<tr[^>]*?>'si", "", $table);
        $table = preg_replace("'<td[^>]*?>'si", "", $table);

        // Mark row and cell boundaries. Case-insensitive so that </TR> and </TD>
        // are handled the same way as the (case-insensitive) opening-tag patterns above.
        $table = str_ireplace("</tr>", "{tr}", $table);
        $table = str_ireplace("</td>", "{td}", $table);

        // Strip every remaining HTML tag.
        $table = preg_replace("'<[/!]*?[^<>]*?>'si", "", $table);

        // Remove line breaks together with the whitespace that follows them.
        // (The previous pattern had lost its backslashes and deleted the literal
        // letters "r"/"n" followed by "s" from the cell text.)
        $table = preg_replace('/[\r\n]\s+/', "", $table);

        // Remove plain spaces. Also drop &nbsp; entities, the usual filler for
        // blank cells; the original repeated the plain-space removal here,
        // which had no effect.
        $table = str_replace(array(" ", "&nbsp;"), "", $table);

        $rows = explode('{tr}', $table);
        array_pop($rows); // discard whatever follows the last </tr>

        // Initialised up front so that input without any row yields an empty
        // array instead of an undefined variable.
        $td_array = array();
        foreach ($rows as $tr) {
                $cells = explode('{td}', $tr);
                array_pop($cells); // discard whatever follows the last </td> of the row
                $td_array[] = $cells;
        }
        return $td_array;
}

?>


 
//返回字符串中的所有单词 $distinct=true 去除重复
<?
/**
 * Collect every run of ASCII letters (a-z, A-Z) found in a string.
 *
 * @param string $str      Text to scan.
 * @param bool   $distinct When truthy (the default), duplicate words are
 *                         removed before sorting; the comparison is case-sensitive.
 * @return array The words found, sorted ascending and indexed from 0.
 */
function split_en_str($str,$distinct=true) {
        preg_match_all('/([a-zA-Z]+)/', $str, $found);

        // Group 1 holds the captured letter runs.
        $words = $found[1];
        if ($distinct) {
                $words = array_unique($words);
        }

        // sort() also renumbers the keys left sparse by array_unique().
        sort($words);
        return $words;
}
?>