php curl 登录163邮箱并抓取邮箱好友列表的代码(经测试) |
本文标签:php,curl,163邮箱 CURL技术说白了就是模拟浏览器的动作实现页面抓取或表单提交,通过此技术可以实现许多有去的功能 。 复制代码 代码如下: <?php error_reporting(0); //邮箱用户名(不带@163.com后缀的) $user = papatata_test; //邮箱密码 $pass = 000000; //目标邮箱 //$mail_addr = uenucom@163.com; //登陆 $url = http://reg.163.com/logins.jsp?type=1&url=http://entry.mail.163.com/coremail/fcg/ntesdoor2?lightweight%3D1%26verifycookie%3D1%26language%3D-1%26style%3D-1; $ch = curl_init($url); //创建一个用于存放cookie信息的临时文件 $cookie = tempnam(.,'); $referer_login = http://mail.163.com; //返回结果存放在变量中,而不是默认的直接输出 curl_setopt($ch, CURLOPT_RETURNTRANSFER, true); curl_setopt($ch, CURLOPT_HEADER, true); curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, 120); curl_setopt($ch, CURLOPT_POST, true); curl_setopt($ch, CURLOPT_REFERER, $referer_login); $fields_post = array( username=> $user, password=> $pass, verifycookie=>1, style=>-1, product=> mail163, selType=>-1, secure=>on ); $headers_login = array( User-Agent => Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9) Gecko/2008052906 Firefox/3.0, Referer => http://www.163.com ); $fields_string = ; foreach($fields_post as $key => $value) { $fields_string .= $key . = . $value . &; } $fields_string = rtrim($fields_string , &); curl_setopt($ch, CURLOPT_COOKIESESSION, true); //关闭连接时,将服务器端返回的cookie保存在以下文件中 curl_setopt($ch, CURLOPT_COOKIEJAR, $cookie); curl_setopt($ch, CURLOPT_HTTPHEADER, $headers_login); curl_setopt($ch, CURLOPT_POST, count($fields)); curl_setopt($ch, CURLOPT_POSTFIELDS, $fields_string); $result= curl_exec($ch); curl_close($ch); //跳转 $url=http://entry.mail.163.com/coremail/fcg/ntesdoor2?lightweight=1&verifycookie=1&language=-1&style=-1&username=loki_wuxi; $ch = curl_init($url); $headers = array( User-Agent => Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9) Gecko/2008052906 Firefox/3.0 ); curl_setopt($ch, CURLOPT_RETURNTRANSFER, true); curl_setopt($ch, CURLOPT_HEADER, true); curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, 120); curl_setopt($ch, CURLOPT_POST, true); curl_setopt($ch, CURLOPT_HTTPHEADER, $headers); //将之前保存的cookie信息,一起发送到服务器端 curl_setopt($ch, CURLOPT_COOKIEFILE, $cookie); curl_setopt($ch, CURLOPT_COOKIEJAR, $cookie); $result = curl_exec($ch); curl_close($ch); //取得sid preg_match(/sid=[^\"].*/, $result, $location); $sid = substr($location[0], 4, -1); //file_put_contents(./result.txt, $sid); //通讯录地址 $url=http://g4a30.mail.163.com/jy3/address/addrlist.jsp?sid=.$sid.&gid=all; $ch = curl_init($url); $headers = array( User-Agent => Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9) Gecko/2008052906 Firefox/3.0 ); curl_setopt($ch, CURLOPT_RETURNTRANSFER, true); curl_setopt($ch, CURLOPT_HEADER, true); curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, 120); curl_setopt($ch, CURLOPT_POST, true); curl_setopt($ch, CURLOPT_HTTPHEADER, $headers); curl_setopt($ch, CURLOPT_COOKIEFILE, $cookie); curl_setopt($ch, CURLOPT_COOKIEJAR, $cookie); $result = curl_exec($ch); curl_close($ch); //file_put_contents(./result.txt, $result); unlink($cookie); //开始抓取内容 preg_match_all(/<td class="Ibx_Td_addrName"><a[^>]*>(.*?)<\/a><\/td><td class="Ibx_Td_addrEmail"><a[^>]*>(.*?)<\/a><\/td>/i, $result,$infos,PREG_SET_ORDER); //1:姓名2:邮箱 print_r($infos); ?> |