資源簡介
Python 爬蟲:登錄小木蟲論壇並爬取交友信息。需要登錄兩次,第二次登錄時要回答一個簡單的問題,詳見源代碼。
session = requests.session()
g = session.get('http://muchong.com/bbs/logging.php?action=login')
g.headers = {"User-Agent", "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/54.0.2840.100 Safari/537.36"}
se = re.s
代碼片段和文件信息
# coding: utf-8
# Log in to the muchong.com forum with a persistent requests session.
# The visible part of the script fetches the login page, scrapes the
# per-request login token and the submit-button value from the HTML, and
# prepares the form payload for the login POST.
import re

import requests
from bs4 import BeautifulSoup

if __name__ == "__main__":

    session = requests.session()
    # Set the User-Agent on the session *before* the first request so it is
    # actually sent; assigning headers to the response object has no effect
    # on what the server sees.
    session.headers.update({
        "User-Agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/54.0.2840.100 Safari/537.36",
    })
    g = session.get('http://muchong.com/bbs/logging.php?action=login')

    # The login form's action URL carries a token in its "t" parameter.
    # NOTE(review): the pattern matches the link text as it appears in this
    # copy of the script; confirm it matches the characters the site serves.
    se = re.search(r'action=login&t=(.*?)">登錄', g.text)
    if se is None:
        raise RuntimeError("login token not found on the login page")
    urls = r'http://muchong.com/bbs/logging.php?action=login&t=' + se.group(1)

    # Value of the submit button, scraped from the same page.
    se = re.search(r'name="loginsubmit" value="(.*?)" class', g.text)
    if se is None:
        raise RuntimeError("loginsubmit value not found on the login page")
    loginsubmit = se.group(1)

    # Form fields for the login POST.
    # NOTE(review): 'formhash' and 'loginsubmit' are hard-coded here even
    # though a submit value was scraped above — confirm which is intended.
    login_infor = {
        'formhash': "46295093",
        'username': "xxxxxx",
        'password': "xxxxxx",
        'cookietime': "31536000",
        'refer': "",
        'loginsubmit': "會員登錄",
    }
    # NOTE(review): the visible source is cut off at this statement;
    # presumably a session.post(...) call to `urls` follows — confirm.
    p = session
評論
共有 條評論