首页 > 代码库 > php 正则抓取页面函数整理

php 正则抓取页面函数整理

整理了一些抓取页面的函数，方便以后使用。

 

 // Page-scraping helpers.

/**
 * Fetch a page over HTTP with cURL and return its body.
 *
 * @param string $url Address of the page to fetch.
 * @return string|false The response body, or false when curl_exec() fails.
 */
function getcontents($url)
{
    $ch = curl_init();
    $timeout = 5; // connection timeout, in seconds
    curl_setopt($ch, CURLOPT_URL, $url);
    // Return the body from curl_exec() instead of printing it.
    curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
    curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, $timeout);
    $contents = curl_exec($ch);
    return $contents;
}

/**
 * Convert the HTML of a table into a two-dimensional array of cell texts.
 *
 * Each closing </tr> ends a row and each closing </td> ends a cell; every
 * other tag is discarded. Note that ALL space characters are removed from
 * the cell contents, so "hello world" becomes "helloworld".
 *
 * @param string $table HTML fragment containing the table.
 * @return array List of rows, each row being a list of cell strings.
 *               An empty array is returned when no complete row is found.
 */
function get_td_array($table)
{
    // Strip the opening <table>, <tr> and <td> tags together with their attributes.
    $table = preg_replace("'<table[^>]*?>'si", "", $table);
    $table = preg_replace("'<tr[^>]*?>'si", "", $table);
    $table = preg_replace("'<td[^>]*?>'si", "", $table);

    // Turn the closing tags into row / cell separators. Case-insensitive so
    // that </TR> and </TD> are handled like the opening tags above.
    $table = str_ireplace("</tr>", "{tr}", $table);
    $table = str_ireplace("</td>", "{td}", $table);

    // Strip every remaining HTML tag.
    $table = preg_replace("'<[\/\!]*?[^<>]*?>'si", "", $table);

    // Strip whitespace: line breaks followed by indentation, then plain spaces.
    $table = preg_replace("'([\r\n])[\s]+'", "", $table);
    // NOTE(review): the source had two identical space replacements; the second
    // was presumably the "&nbsp;" entity before the page rendering decoded it.
    $table = str_replace(array(" ", "&nbsp;"), "", $table);

    // Split into rows; the piece after the last {tr} is trailing residue.
    $rows = explode('{tr}', $table);
    array_pop($rows);

    // Initialise the result so an input without rows yields an empty array.
    $td_array = array();
    foreach ($rows as $tr) {
        // Split into cells; the piece after the last {td} is trailing residue.
        $td = explode('{td}', $tr);
        array_pop($td);
        $td_array[] = $td;
    }

    return $td_array;
}

// POST data to a page (simulated form submission for scraping).
//
// NOTE(review): the definition of curlPost() is corrupted and truncated in
// this copy: a site URL was injected after "=" signs and the text ends in the
// middle of the function body. It is preserved here as a comment instead of
// being completed by guesswork. With the injected URL removed, the visible
// part reads:
//
// function curlPost($url, $postData = array()) {
//     $o = "";   // presumably; only `"";` of this statement survives
//     foreach ($postData as $k => $v) {
//         $o .= "$k=" . urlencode($v) . "&";
//     }
//     $postData = substr($o, 0, -1);
//     ... (remainder of the function is missing from the source)

  

 

php 正则抓取页面函数整理