admin 管理员组文章数量: 1184232
2024年3月7日发(作者:graphics 730)
import urllib2import urllibimport reimport pytesserimport StringIOimport Imageimport cookielibimport chardetimport timeclass ScoreCrawl(object): def __init__(self , username = "*******" ,password='******'): me = username rd = password rl ='/?exit=1' rl ='/Public/?image=1052561647' Jar = Jar() httpHandler = ndler(debuglevel=1)
httpsHandler = andler(debuglevel=1)
= _opener(okieProcessor(Jar),httpHandler, httpsHandler) =[]
def getImageCodeAndCookie(self): try: im = (rl).read() #获取验证码和cookies值 img_buffer = IO(im) img = (img_buffer) textcode = _to_string(img) print 'Cookies:'
for item in Jar: if =='_SessionId': nId = print ' Name = '+ print ' Value = '+
print 'ImageCode=',textcode return textcode except Exception as e: print 'Failed to get imagecode!', e return '' def login(self): postdata ={ 'UserName':me, 'PassWord':rd, 'drpLoginType':1, 'ScriptManager1':'UpdatePanel2|btLogin', '__EVENTTARGET':'btLogin', rl ='/Gstudent/Course/?EID=l0RCAjrC!60Alnrcjky12Ad6vU4OJDrqYylAGKDjRFO3OCFxhesOvg==& '__VIEWSTATE':'''/wEPDwULLTE3MzIzNjYwNjMPZBYCAgMPZBYGAg0PZBYCZg9kFgICAQ8PFgIeCEltYWdlVXJsBSp+L1B1YmxpYy9WYWxpZGF0Z '__ASYNCPOST':'true' } code = geCodeAndCookie() postdata['ValidateCode']=code[:4] print 'postdata:',postdata postdata=ode(postdata) # POST的数据 myRequest = t(url = rl,data = postdata) _header('Accept','*/*')# _header('Content-Length','792') _header('Accept-Encoding','gzip,deflate,sdch') _header('Accept-Language','zh-CN,zh;q=0.8') _header('Cache-Control','no-cache') _header('Connection','keep-alive') _header('Content-Type','application/x-www-form-urlencoded; charset=UTF-8')# _header('Cookie:LoginType','LoginType=1; _SessionId='+ nId) _header('Host','') _header('Origin','') _header('Referer','/?exit=1') '__EVENTVALIDATION':'/wEdAApk+MhPeRcW7LbXAbrLM7jrR1LBKX1P1xh290RQyTesRQa+ROBMEf7egV772v+RsRJUvPovksJgUuQnp+WD/+4LQ
版权声明:本文标题:python爬虫实例-爬取北邮研究生成绩 内容由网友自发贡献,该文观点仅代表作者本人, 转载请联系作者并注明出处:http://www.roclinux.cn/p/1709807038a547053.html, 本站仅提供信息存储空间服务,不拥有所有权,不承担相关法律责任。如发现本站有涉嫌抄袭侵权/违法违规的内容,一经查实,本站将立刻删除。
发表评论