作者:书友64457430 | 来源:互联网 | 2018-03-23 17:34
跳至
db = $db;
}
/**
 * Download the body of a URL and return it with surrounding whitespace removed.
 *
 * When the cURL extension is loaded the request is made through cURL
 * (redirects are followed, response headers are not included in the result);
 * otherwise file_get_contents() is used.
 *
 * @param string $url Address to fetch; leading/trailing whitespace is ignored.
 * @return string Trimmed response body, or '' when the transfer fails.
 */
function geturlfile($url) {
    $url = trim($url);
    $content = '';
    if (extension_loaded('curl')) {
        $ch = curl_init();
        curl_setopt($ch, CURLOPT_URL, $url);
        // Return the body from curl_exec() instead of printing it.
        curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
        curl_setopt($ch, CURLOPT_FOLLOWLOCATION, 1);
        curl_setopt($ch, CURLOPT_HEADER, 0);
        $content = curl_exec($ch);
        curl_close($ch);
    } else {
        $content = file_get_contents($url);
    }
    // Both transports report failure with false; callers expect a string.
    if ($content === false) {
        return '';
    }
    // The result must be read from the same variable it was stored in:
    // PHP variable names are case-sensitive.
    return trim($content);
}
/**
 * Collect the target and link text of every anchor tag in an HTML fragment.
 *
 * Only anchors whose first attribute is href and whose content contains no
 * nested tags are matched. Matching is case-insensitive and may span lines.
 *
 * @param string $code HTML fragment to scan.
 * @return array Map with two parallel lists: 'name' holds the link texts and
 *               'url' holds the href values. Both are empty when nothing
 *               matches or the pattern cannot be applied.
 */
function get_all_url($code) {
    // Group 1: href value (optionally quoted); group 2: text between <a ...> and </a>.
    // The '|' inside ["|\'] is a literal character of the class, kept as in the
    // commonly published form of this pattern.
    $pattern = '/<a\s+href=["|\']?([^>"\' ]+)["|\']?\s*[^>]*>([^>]+)<\/a>/is';
    // preg_match_all() yields 0 for no match and false on error; either way
    // there is nothing to report.
    if (!preg_match_all($pattern, $code, $arr)) {
        return array('name' => array(), 'url' => array());
    }
    return array('name' => $arr[2], 'url' => $arr[1]);
}
/**
 * Return the part of a string that lies between a start and an end marker.
 *
 * Both markers are trimmed before use. The text following the first
 * occurrence of $start (up to the next occurrence of $start, if any) is cut
 * at the first occurrence of $end.
 *
 * @param string $str   Text to search.
 * @param string $start Marker that precedes the wanted section.
 * @param string $end   Marker that follows the wanted section.
 * @return string $str unchanged when either marker is empty after trimming;
 *                '' when $start does not occur in $str; otherwise the
 *                extracted section (the whole remainder if $end is absent).
 */
function get_sub_content($str, $start, $end) {
    $start = trim($start);
    $end = trim($end);
    if ($start === '' || $end === '') {
        return $str;
    }
    $parts = explode($start, $str);
    // No start marker: there is no segment after it, so avoid reading an
    // undefined offset and passing null to explode().
    if (!isset($parts[1])) {
        return '';
    }
    $section = explode($end, $parts[1]);
    return $section[0];
}
/**
 * Debug helper: print a var_dump() of the value, preceded and followed by
 * two CRLF line breaks.
 *
 * @param mixed $var Value to dump.
 * @return void
 */
function vd($var) {
    // Leading padding.
    echo "\r\n", "\r\n";
    var_dump($var);
    // Trailing padding; the final empty string emits nothing.
    echo "\r\n\r\n", "";
}
}
?>geturlfile($url);
// Delimiters of the list section to scrape. Both are empty here, in which
// case get_sub_content() returns its input unchanged.
// NOTE(review): these look like placeholders whose HTML markers were lost — confirm.
$start = '';
$end = '';
// Cut the list section out of $html, then collect the article URLs and titles in it.
// NOTE(review): $html and $gather are set before this point, outside the visible code — confirm.
$code = $gather->get_sub_content($html, $start, $end);
$newsAry = $gather->get_all_url($code);
// Debug output of the collected list (disabled)
//$gather->vd($newsAry);
// Use the first URL found as the target page.
$tarGetUrl = $newsAry['url'][0];
// Fetch the HTML of the target URL
$html = $gather->geturlfile($tarGetUrl);
// Delimiters of the section to extract from the target page (empty here as well).
$start = '';
$end = '';
// Extract the section between the delimiters from the target page.
$code = $gather->get_sub_content($html, $start, $end);
// Fragments to remove from the extracted section; both are empty strings here.
// NOTE(review): presumably unwanted HTML snippets were meant to go here — confirm.
$killHtml = '';
$killHtml2 = '';
$code = str_replace($killHtml, "", $code);
$code = str_replace($killHtml2, "", $code);
// Dump the final result.
$gather->vd($code);
?>