利用正则,代码如下:
/**
 * Fetches a Baidu search result page for a fixed keyword and prints the
 * href of the first anchor whose data-click attribute starts with
 * {'rsv_snapshot':'1'} (presumably the cached "snapshot" link of the
 * first result - confirm against current Baidu markup).
 *
 * Prints the extracted URL, or an empty string when the page could not be
 * downloaded or no matching anchor/href was found, and then terminates
 * the script.
 */
public function kuaizhaoo() {
    $text = '你要搜索的内容';

    // The keyword must be URL-encoded: raw non-ASCII text, spaces, '&' or
    // '#' would otherwise produce a malformed or truncated query string.
    $url = 'http://www.baidu.com/s?word=' . urlencode($text);

    $snapshotUrl = '';
    $html = file_get_contents($url);

    // file_get_contents() returns false on failure; only parse real content.
    if ($html !== false) {
        // Locate the whole <a ...>...</a> element carrying the snapshot marker.
        $regex = "/<a.?data-click=\"{'rsv_snapshot':'1'}.*?\">(.*?)<\/a>/is";

        // Capture the href value directly instead of stripping 'href="' with a
        // case-sensitive str_replace, which left the prefix in place whenever
        // the attribute was written in a different case (e.g. HREF="...").
        $hrefRegex = '/href="(.*?)"/i';

        if (preg_match($regex, $html, $matches) === 1
            && preg_match($hrefRegex, $matches[0], $hrefMatch) === 1
        ) {
            $snapshotUrl = $hrefMatch[1];
        }
    }

    echo ($snapshotUrl);die();
}
2017-1-16更新:
把 file_get_contents 换成 curl 可以提高效率
参见另外一篇博客:http://blog.youkuaiyun.com/qq_28018283/article/details/53337984