- 论坛徽章:
- 1
|
本帖最后由 cc7756789w 于 2015-04-20 16:39 编辑
- #!/usr/bin/python
- # -*- encoding:utf-8 -*-
- import urllib
- import urllib2
- import re
- import random
# NOTE(review): the URL below is blank in this copy of the script -- it looks
# like a scrubbed placeholder. Set it to the real login page URL before
# running.
login_url = ' '

# Fetch the login page once; its HTML is scanned later for the captcha image
# and the hidden captcha-id field. Python 2 urllib2 responses are not context
# managers, so close the response explicitly instead of leaking the socket.
_login_page = urllib2.urlopen(login_url)
try:
    html = _login_page.read()
finally:
    _login_page.close()
# Matches the captcha <img> tag and captures the value of its src attribute.
_CAPTCHA_IMG_RE = re.compile(
    r'<img id="captcha_image" src="(.*?)" alt="captcha" class="captcha_image"/>'
)


def get_captcha(html):
    """Download every captcha image referenced in *html*.

    Each captured ``src`` URL is fetched with ``urllib.urlretrieve`` and saved
    in the current working directory as ``<n>.jpg``, where ``n`` is a random
    integer between 1 and 1000 (so an existing file with the same name may be
    overwritten).

    Args:
        html: Page source to scan for the captcha ``<img>`` tag.

    Returns:
        A list of the file names the images were saved under, in the order
        the tags appear in *html*. The list is empty when *html* contains no
        captcha tag.
    """
    saved_files = []
    for image_url in _CAPTCHA_IMG_RE.findall(html):
        filename = '%d.jpg' % random.randint(1, 1000)
        urllib.urlretrieve(image_url, filename)
        # Report the name back so the caller can tell the user which file
        # to open; the name is random and otherwise unknowable.
        saved_files.append(filename)
    return saved_files
# Save the captcha image(s) locally so the user can read the challenge text.
get_captcha(html)

# re.findall returns a *list* of matches. The form field needs the bare token
# string: passing the list to urlencode would post its repr ("['...']").
# An empty result means the page did not include a captcha.
captcha_ids = re.findall(r'<input type="hidden" name="captcha-id" value="(.*?)"/>', html)
captcha_id = captcha_ids[0] if captcha_ids else ''
print(captcha_id)

form_fields = {
    'source': 'index_nav',
    'form_email': 'xx@qq.com',
    'form_password': '77xxxw',
    'user_login': '登录',
}
if captcha_id:
    # Only ask for a solution when there is actually a captcha to solve.
    captcha = raw_input('Please input captcha: ')
    form_fields['captcha-solution'] = captcha
    form_fields['captcha-id'] = captcha_id
else:
    captcha = ''
postdata = urllib.urlencode(form_fields)

head = {
    # Adjacent literals instead of a backslash continuation inside the string:
    # the continuation form embeds the next line's leading whitespace in the
    # header value.
    'User-Agent': (
        'Mozilla/5.0 (Windows NT 6.1; WOW64) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/41.0.2272.118 Safari/537.36'
    ),
}

# Supplying `data` makes urllib2 issue a POST to the login URL.
req = urllib2.Request(url=login_url, data=postdata, headers=head)

# Python 2 urllib2 responses are not context managers; close explicitly.
_login_response = urllib2.urlopen(req)
try:
    result = _login_response.read()
finally:
    _login_response.close()

# The response body is raw bytes, so write it in binary mode to keep it
# byte-for-byte intact (text mode would translate newlines on Windows).
with open('a.html', 'wb') as f:
    f.write(result)
复制代码 |
|