Heim > Backend-Entwicklung > PHP-Tutorial > 求php远程抓取代码

求php远程抓取代码

WBOYWBOYWBOYWBOYWBOYWBOYWBOYWBOYWBOYWBOYWBOYWBOYWB
Freigeben: 2016-06-23 13:43:33
Original
1084 Leute haben es durchsucht



http://www.taodaxiang.com/credit/index/init

这个页面需要post查询后。在抓取查询的数据。这个用php怎么写?求代码


回复讨论(解决方案)

建议你参考一下CURL
百度一下有很多

不行。百度的都抓取失败。

没有人吗?

curl 就可以,不过查询到的信息是通过 app_init.js 动态写入页面的
所以你还需抓取 app_init.js 后自行解析

比如取回的页面中有

<td>注册时间:<p id='info_regtime'></p></td><td>实名认证:<p id='info_auth'></p></td>
Nach dem Login kopieren
app_init.js 中有
$("#info_regtime").html("<span style='color:green'><b>"+data.regtime+"</b></span>");$("#info_auth").html("<span style='color:"+color+"'><b>"+data.auth+"</b></span>");
Nach dem Login kopieren

curl 这个好像不用你说哟。php抓取三种方式,我都试过了。就是抓取失败。所以才来发帖求助

js?入dom的,需要curl後再分析,再curl?取的。

我试了下只能抓取到一个空页面(就一个[] 内容),应该是做了只能本站点提交表单的限制

<?phpclass mycurl {     protected $_useragent = 'Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1';     protected $_url;     protected $_followlocation;     protected $_timeout;     protected $_maxRedirects;     protected $_cookieFileLocation = './cookie.txt';     protected $_post;     protected $_postFields;     protected $_referer ="http://www.taodaxiang.com/credit/index/init";     protected $_session;     protected $_webpage;     protected $_includeHeader;     protected $_noBody;     protected $_status;     protected $_binaryTransfer;     public    $authentication = 0;     public    $auth_name      = '';     public    $auth_pass      = '';     public function useAuth($use){       $this->authentication = 0;       if($use == true) $this->authentication = 1;     }     public function setName($name){       $this->auth_name = $name;     }     public function setPass($pass){       $this->auth_pass = $pass;     }     public function __construct($url,$followlocation = true,$timeOut = 30,$maxRedirecs = 4,$binaryTransfer = false,$includeHeader = false,$noBody = false)     {         $this->_url = $url;         $this->_followlocation = $followlocation;         $this->_timeout = $timeOut;         $this->_maxRedirects = $maxRedirecs;         $this->_noBody = $noBody;         $this->_includeHeader = $includeHeader;         $this->_binaryTransfer = $binaryTransfer;         $this->_cookieFileLocation = dirname(__FILE__).'/cookie.txt';     }     public function setReferer($referer){       $this->_referer = $referer;     }     public function setCookiFileLocation($path)     {         $this->_cookieFileLocation = $path;     }     public function setPost ($postFields)     {        $this->_post = true;        $this->_postFields = $postFields;     }     public function setUserAgent($userAgent)     {         $this->_useragent = $userAgent;     }     public function createCurl($url = 'nul')     {        if($url != 'nul'){          $this->_url = $url;        }         $s = curl_init();         curl_setopt($s,CURLOPT_URL,$this->_url);         curl_setopt($s,CURLOPT_HTTPHEADER,array('Expect:'));         curl_setopt($s,CURLOPT_TIMEOUT,$this->_timeout);         curl_setopt($s,CURLOPT_MAXREDIRS,$this->_maxRedirects);         curl_setopt($s,CURLOPT_RETURNTRANSFER,true);         curl_setopt($s,CURLOPT_FOLLOWLOCATION,$this->_followlocation);         curl_setopt($s,CURLOPT_COOKIEJAR,$this->_cookieFileLocation);         curl_setopt($s,CURLOPT_COOKIEFILE,$this->_cookieFileLocation);         if($this->authentication == 1){           curl_setopt($s, CURLOPT_USERPWD, $this->auth_name.':'.$this->auth_pass);         }         if($this->_post)         {             curl_setopt($s,CURLOPT_POST,true);             curl_setopt($s,CURLOPT_POSTFIELDS,$this->_postFields);         }         if($this->_includeHeader)         {               curl_setopt($s,CURLOPT_HEADER,true);         }         if($this->_noBody)         {             curl_setopt($s,CURLOPT_NOBODY,true);         }         /*         if($this->_binary)         {             curl_setopt($s,CURLOPT_BINARYTRANSFER,true);         }         */         curl_setopt($s,CURLOPT_USERAGENT,$this->_useragent);         curl_setopt($s,CURLOPT_REFERER,$this->_referer);         $this->_webpage = curl_exec($s);                   $this->_status = curl_getinfo($s,CURLINFO_HTTP_CODE);         curl_close($s);     }   public function getHttpStatus()   {       return $this->_status;   }   public function __tostring(){      return $this->_webpage;   }}$m=new mycurl("http://www.taodaxiang.com/credit/index/get");$m->setReferer("http://www.taodaxiang.com/credit/index/init");$m->setPost(Array("account"=>"cupjava"));$m->createCurl();echo $m;?>
Nach dem Login kopieren

json结果出来解析一下就好了

9楼是神人。万分感谢,可以了

Verwandte Etiketten:
Erklärung dieser Website
Der Inhalt dieses Artikels wird freiwillig von Internetnutzern beigesteuert und das Urheberrecht liegt beim ursprünglichen Autor. Diese Website übernimmt keine entsprechende rechtliche Verantwortung. Wenn Sie Inhalte finden, bei denen der Verdacht eines Plagiats oder einer Rechtsverletzung besteht, wenden Sie sich bitte an admin@php.cn
Beliebte Tutorials
Mehr>
Neueste Downloads
Mehr>
Web-Effekte
Quellcode der Website
Website-Materialien
Frontend-Vorlage