curl模拟带验证码的登录
首先说明,不是用php自动识别验证码,而是有验证码的情况下,让你通过curl 带着cookies去请求远程资源,从而通过合法的身份验证。主要用来抓取需要登录后才能访问的资源。
思路就是获取到验证码之后把验证码存储为一个图片,然后程序休眠20秒,在20秒之后由用户手动查看图片,并把验证码填写到code.txt文件中,20秒休眠完成后,程序会读code.txt的验证码,这样再带着验证码进行登录操作。
示例代码如下:
//初始化变量 $cookie_file = "tmp.cookie"; $login_url = "http://xxx.com/logon.php"; $verify_code_url = "http://xxx.com/verifyCode.php"; echo "正在获取COOKIE...n"; $curlj = curl_init(); $timeout = 5; curl_setopt($curl, CURLOPT_URL, $login_url); curl_setopt($curl, CURLOPT_RETURNTRANSFER, 1); curl_setopt($curl, CURLOPT_CONNECTTIMEOUT, $timeout); curl_setopt($curl,CURLOPT_COOKIEJAR,$cookie_file); //获取COOKIE并存储 $contents = curl_exec($curl); curl_close($curl); echo "COOKIE获取完成,正在取验证码...n"; //取出验证码 www.111cn.net $curl = curl_init(); curl_setopt($curl, CURLOPT_URL, $verify_code_url); curl_setopt($curl, CURLOPT_COOKIEFILE, $cookie_file); curl_setopt($curl, CURLOPT_HEADER, 0); curl_setopt($curl, CURLOPT_RETURNTRANSFER, 1); $img = curl_exec($curl); curl_close($curl); $fp = fopen("verifyCode.jpg","w"); fwrite($fp,$img); fclose($fp); echo "验证码取出完成,正在休眠,20秒内请把验证码填入code.txt并保存n"; //停止运行20秒 sleep(20); echo "休眠完成,开始取验证码...n"; $code = file_get_contents("code.txt"); echo "验证码成功取出:$coden"; echo "正在准备模拟登录...n"; $post = "username=maben&pwd=hahahaha&verifycode=$code"; $curl = curl_init(); curl_setopt($curl, CURLOPT_URL, $url); curl_setopt($curl, CURLOPT_HEADER, false); curl_setopt($curl, CURLOPT_RETURNTRANSFER,1); curl_setopt($curl, CURLOPT_POSTFIELDS, $post); curl_setopt($curl, CURLOPT_COOKIEFILE, $cookie_file); $result=curl_exec($curl); curl_close($curl); //这一块根据自己抓包获取到的网站上的数据来做判断 if(substr_count($result,"登录成功")){ echo "登录成功n"; }else{ echo "登录失败n"; exit; } //啦啦啦,开始做你想做的事吧。。。。。