首页 > PHP, SEO > 百度排名抓取

百度排名抓取

function s($keyword,$url,$page = 1){
static $px = 0;
$rsState = false;

$enKeyword = urlencode($keyword);
$firstRow = ($page – 1) * 10;

if($page > 10){
die(’10页之内没有该网站排名..end’);
}
$contents = file_get_contents(“http://www.baidu.com/s?wd=$enKeyword&&pn=$firstRow”);
preg_match_all(‘/<table[^>]*?class=”result”[^>]*>[\s\S]*?<\/table>/i’,$contents,$rs);
foreach($rs[0] as $k=>$v){
$px++;
if(strstr($v,$url)){
$rsState = true;
preg_match_all(‘/<h3[\s\S]*?(<a[\s\S]*?<\/a>)/’,$v,$rs_t);
echo ‘当前 “‘ . $url . ‘” 在百度关键字 “‘ . $keyword . ‘” 中的排名为:’ . $px;
echo ‘<br>’;
echo ‘第’ . $page . ‘页;第’ . ++$k . “个<a target=’_blank’ href=’http://www.baidu.com/s?wd=$enKeyword&&pn=$firstRow’>进入百度</a>&#8221;;
echo ‘<br>’;
echo $rs_t[1][0];
break;
}
}
unset($contents);
if($rsState === false){
s($keyword, $url,++$page);
}
}
if(isset($_POST[‘submit’])){

$time = explode(‘ ‘,microtime());
$start = $time[0] + $time[1];

$url = $_POST[‘url’];
if( count(explode(‘.’,$url)) <= 2){

$url = ltrim($url,’http://&#8217;);
$url = ‘www.’ . $url;
}

s($_POST[‘keyword’],$url);

$endtime = explode(‘ ‘,microtime());

$end = $endtime[0] + $endtime[1];

echo ‘<hr>’;
echo ‘程序运行时间: ‘;
echo $end – $start;
die();
}

?>

<!DOCTYPE html PUBLIC “-//W3C//DTD XHTML 1.0 Transitional//EN” “http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd”&gt;
<html xmlns=”http://www.w3.org/1999/xhtml”&gt;
<head>
<meta http-equiv=”Content-Type” content=”text/html; charset=gbk” />
<title>抓取排名</title>

</head>

<body>
<form action=”” method=”post”>
<ul>
<li>
<span>关键字:</span><input type=”text” name=”keyword”>
</li>
<li>
<span>url地址:</span><input type=”text” name=”url”>
</li>
<li>
<input type=”submit” name=”submit” value=”搜索”>
</li>
</ul>

</form>
</body>
</html>

分类:PHP, SEO 标签:, ,
  1. 还没有评论。
  1. No trackbacks yet.

发表评论

Fill in your details below or click an icon to log in:

WordPress.com Logo

You are commenting using your WordPress.com account. Log Out / 更改 )

Twitter picture

You are commenting using your Twitter account. Log Out / 更改 )

Facebook photo

You are commenting using your Facebook account. Log Out / 更改 )

Google+ photo

You are commenting using your Google+ account. Log Out / 更改 )

Connecting to %s

%d 博主赞过: