用Simple HTML DOM自動查高考分數與錄取情況
- 2019 年 10 月 6 日
- 筆記
這個程式原本是做來給自己用的,免去了查成績的手抖又心跳加速打資訊打錯等各種問題,頁面改動後直接發送郵件到自己的郵箱里,不看也不行→_→哈哈哈 Simple HTML DOM:http://simplehtmldom.sourceforge.net/ 我這裡用的查詢地址是廣州招考的,查詢沒有驗證碼,沒有了驗證碼識別的問題。

先模擬一次提交,找到提交數據。

用Curl模擬提交
$cookie_file = tempnam("tmp","cookie"); function postData($url, $data) { global $cookie_file; $ch = curl_init(); $timeout = 300; curl_setopt($ch, CURLOPT_URL, $url); curl_setopt($ch, CURLOPT_POST, true); curl_setopt($ch, CURLOPT_POSTFIELDS, $data); curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1); curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, $timeout); curl_setopt($ch, CURLOPT_COOKIEJAR, $cookie_file); $handles = curl_exec($ch); curl_close($ch); return $handles; } $contents = file_get_contents("http://gaokao.gzzk.cn/mopub_login3.aspx"); $html = str_get_html($contents); $__VIEWSTATE = $html->find('#__VIEWSTATE',0)->attr['value']; $__VIEWSTATEGENERATOR = $html->find('#__VIEWSTATEGENERATOR',0)->attr['value']; $__EVENTVALIDATION = $html->find('#__EVENTVALIDATION',0)->attr['value']; $url='http://gaokao.gzzk.cn/mopub_login3.aspx'; $argv = array( '__EVENTTARGET' => "LoginButton", '__EVENTARGUMENT' => "", '__VIEWSTATE' => $__VIEWSTATE, '__VIEWSTATEGENERATOR' => $__VIEWSTATEGENERATOR, '__EVENTVALIDATION' => $__EVENTVALIDATION, 'text_biaoshi' => "", //考號 'text_mima' => '' //密碼 ); $rdata = postData($url, $argv);
測試發現還有來源驗證。。於是postData函數多加一行設置Referer。
測試成功,還有一層跳轉

圖中的鏈接對應結果頁。
$html2 = str_get_html($rdata); $newurl = "http://gaokao.gzzk.cn" . $html2->find('a',0)->attr['href']; $contents2 = getData($newurl); 
成功!再把成績表格選取出來,並添加MD5驗證,如果MD5沒有變,則每隔5秒刷新,在頁面改動後,把這個選取出來的表格作為郵件正文發送到我的郵箱即可。
$html3 = str_get_html($contents2); $result = $html3->find('#td_center',0)->innertext; echo $result; //result -> 成績表格
完整源碼
<html> <head> <meta http-equiv="content-type" content="text/html;charset=utf-8"> </head> <body> <?php $cookie_file = tempnam("tmp","cookie"); function postData($url, $data) { global $cookie_file; $ch = curl_init(); $timeout = 300; curl_setopt($ch, CURLOPT_URL, $url); curl_setopt($ch, CURLOPT_REFERER, "http://gaokao.gzzk.cn/mopub_login3.aspx"); curl_setopt($ch, CURLOPT_POST, true); curl_setopt($ch, CURLOPT_POSTFIELDS, $data); curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1); curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, $timeout); curl_setopt($ch, CURLOPT_COOKIEJAR, $cookie_file); $handles = curl_exec($ch); curl_close($ch); return $handles; } function getData($url) { global $cookie_file; $ch = curl_init(); $timeout = 300; curl_setopt($ch, CURLOPT_URL, $url); curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1); curl_setopt($ch, CURLOPT_HEADER, 0); curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, $timeout); curl_setopt($ch, CURLOPT_COOKIEFILE, $cookie_file); $handles = curl_exec($ch); curl_close($ch); return $handles; } include("simple_html_dom.php"); $contents = file_get_contents("http://gaokao.gzzk.cn/mopub_login3.aspx"); $html = str_get_html($contents); $__VIEWSTATE = $html->find('#__VIEWSTATE',0)->attr['value']; $__VIEWSTATEGENERATOR = $html->find('#__VIEWSTATEGENERATOR',0)->attr['value']; $__EVENTVALIDATION = $html->find('#__EVENTVALIDATION',0)->attr['value']; $url='http://gaokao.gzzk.cn/mopub_login3.aspx'; $argv = array( '__EVENTTARGET' => "LoginButton", '__EVENTARGUMENT' => "", '__VIEWSTATE' => $__VIEWSTATE, '__VIEWSTATEGENERATOR' => $__VIEWSTATEGENERATOR, '__EVENTVALIDATION' => $__EVENTVALIDATION, 'text_biaoshi' => "", //考號 'text_mima' => '' //密碼 ); $rdata = postData($url, $argv); $html2 = str_get_html($rdata); $newurl = "http://gaokao.gzzk.cn" . $html2->find('a',0)->attr['href']; $contents2 = getData($newurl); $html3 = str_get_html($contents2); $result = $html3->find('#td_center',0)->innertext; echo $result; //result -> 成績表格 $originmd5 = ""; //成績出來前的td_center的MD5 $currentmd5 = md5($result); if($currentmd5 != $originmd5) { echo "頁面發生改動!"; $tablelist = $html3->find('#table_list',0)->innertext; $html4 = str_get_html($tablelist); $totalmark = $html4->find('td.mytdfenge1',23)->innertext; //算總分 //DO STH } else { echo '<meta http-equiv="refresh" content="5;url=checker.php">'; } ?> </body> </html>