- 論壇徽章:
- 0
|
[PHP]代碼- <?php
// Fetch today's ranking feed from top.finance.sina.com.cn and collect the raw
// `"url":"...` fragments it contains into $article.
//error_reporting(0);
$date = date("Ymd");
$url = "http://top.finance.sina.com.cn/ws/GetTopDataList.php?top_type=day&top_cat=all&top_time=" . $date . "&top_show_num=20&top_order=ASC";

// Declare the output charset before anything can be written: a warning emitted
// by a failed fetch would otherwise be output first and block the header.
header("Content-Type:text/html;charset=gb2312");

$doc = file_get_contents($url);
if ($doc === false) {
    // The feed could not be downloaded; continue with an empty article list.
    $doc = '';
}

// Capture each `"url":"` key together with everything up to (not including)
// the closing quote. The previous ungreedy pattern `.*l` stopped at the first
// letter "l" after the key, truncating any URL with an "l" before its extension.
preg_match_all('/"url":"[^"]*/', $doc, $article);

// preg_match_all() fills a two-dimensional array; element 0 holds the full matches.
$article = current($article);

// Not referenced by the visible code; kept in case another part of the script reads it.
$rule = "/\"url\":(.*)\"\"/";
/**
 * Reduce one raw `"url":"...` fragment to the bare URL.
 *
 * Backslashes are removed with stripslashes() first, then every occurrence of
 * the `"url":"` key marker is deleted from the result.
 *
 * @param string $string Raw fragment, e.g. `"url":"http:\/\/host\/page.html`.
 * @return string The fragment without backslashes and without the key marker.
 */
function OnlyUrl($string)
{
    return str_replace('"url":"', "", stripslashes($string));
}
-
// This script declares GetTitle() more than once. Two unconditional
// declarations of the same name are a fatal "Cannot redeclare" error, so this
// one is only defined when no other declaration is already in effect.
if (!function_exists('GetTitle')) {
    /**
     * Fetch a page and return the text of its first `<h1 ...>` heading.
     *
     * Previously this function echoed the preg_match() result array (printing
     * "Array") and returned nothing.
     *
     * @param string $url Location of the article page (anything file_get_contents() accepts).
     * @return string Text between the heading's tags, or '' when the page cannot
     *                be read or contains no matching heading.
     */
    function GetTitle($url)
    {
        $doc = file_get_contents($url);
        if ($doc === false) {
            return '';
        }

        // Only headings that carry attributes ("<h1 " followed by a space) are matched.
        $rule = "/<h1 (.*)<\/h1>/";
        if (!preg_match($rule, $doc, $result)) {
            return '';
        }

        // Strip the surrounding tags: keep what lies between the first ">" and the last "<".
        if (!preg_match("/>(.*)</", $result[0], $title)) {
            return '';
        }

        return $title[1];
    }
}
// Replace every raw fragment in $article with its bare URL. Elements are
// written back by key instead of through a by-reference loop variable, which
// would stay bound to the last element after the loop and let a later
// assignment to that variable silently overwrite it.
foreach ($article as $index => $fragment) {
    $article[$index] = OnlyUrl($fragment);
}
- ?>
- <?php
// This script declares GetTitle() more than once. Two unconditional
// declarations of the same name are a fatal "Cannot redeclare" error, so this
// one is only defined when no other declaration is already in effect.
if (!function_exists('GetTitle')) {
    /**
     * Fetch a page and return the text of one of its `<h1 ...>` headings.
     *
     * The second matching heading is used when the page has one, as in the
     * original code; otherwise the first is used. Previously the page was
     * never downloaded: the pattern ran against an undefined $doc.
     *
     * @param string $url Location of the article page (anything file_get_contents() accepts).
     * @return string Text between the heading's tags, or '' when the page cannot
     *                be read or contains no matching heading.
     */
    function GetTitle($url)
    {
        $doc = file_get_contents($url);
        if ($doc === false) {
            return '';
        }

        // Only headings that carry attributes ("<h1 " followed by a space) are matched.
        $rule = "/<h1 (.*)<\/h1>/";
        if (!preg_match_all($rule, $doc, $result)) {
            return '';
        }

        // $result[0] lists the full matches in document order.
        $heading = isset($result[0][1]) ? $result[0][1] : $result[0][0];

        // Cut away the <h1 ...> and </h1> tags.
        $rule = "/>(.*)</";
        if (!preg_match($rule, $heading, $title)) {
            return '';
        }

        return $title[1];
    }
}
/**
 * Fetch a page and print its article body.
 *
 * The body is the span from the first "publish_helper" marker to the last
 * "publish_helper_end" marker. If that span contains a closing </blockquote>,
 * everything from its start through the last </blockquote> (the link section,
 * per the original comments) is removed before printing.
 *
 * Nothing is printed when the page cannot be read or the markers are absent;
 * previously those cases fell through to undefined-offset warnings.
 *
 * @param string $url Location of the article page (anything file_get_contents() accepts).
 * @return void Output is written with echo.
 */
function GetContent($url)
{
    $doc = file_get_contents($url);
    if ($doc === false) {
        return;
    }

    // Body section, markers included. The "s" modifier lets "." span line breaks.
    if (!preg_match("/publish_helper(.*)publish_helper_end/xs", $doc, $result)) {
        return;
    }
    $content = $result[0];

    // Leading link section, when present.
    if (preg_match("/publish_helper(.*)<\/blockquote>/xs", $content, $out)) {
        $content = str_replace($out[0], "", $content);
    }

    echo $content;
}
- ?>
複製代碼 |
|