資源簡介
代碼片段和文件信息
import os
import re
from multiprocessing.dummy import Pool as ThreadPool

import requests
from lxml import etree
?
def gethtml(url: str, encode: str) -> str:
    """Fetch a web page and return its source text.

    Args:
        url: Address of the page to download.
        encode: Name of the text encoding to decode the response body with
            (for example ``"utf-8"``).

    Returns:
        The response body decoded as text.
    """
    r = requests.get(url)
    # Set the encoding explicitly so r.text is decoded with the caller's
    # choice rather than whatever the response object defaulted to.
    r.encoding = encode
    return r.text
?
def filterFName(FName: str) -> str:
    """Replace special characters in a file name with underscores.

    Each occurrence of ``/ \\ : * ? " < > |`` is replaced by a single ``_``;
    all other characters are left untouched.

    Args:
        FName: Candidate file name.

    Returns:
        The file name with every matched character replaced by ``_``.
    """
    # Character class listing the characters to strip from file names.
    rstr = r"[\/\\\:\*\?\"\<\>\|]"
    return re.sub(rstr, "_", FName)
?
def mkdir(path: str) -> None:
    """Create a directory (and any missing parents) if it does not exist.

    Args:
        path: Directory path; leading and trailing whitespace is stripped
            before use.
    """
    path = path.strip()
    if not os.path.exists(path):
        # exist_ok=True tolerates another thread creating the directory
        # between the existence check above and this call.
        os.makedirs(path, exist_ok=True)
?
def?geturl(url):?#獲取網站各個分類鏈接、分類名稱
????html?=?gethtml(url‘utf-8‘)
????ehtml?=?etree.HTML(html)
????nurl?=?ehtml.xpath(‘//*[@id=“chenxing_menu“]/li/a/@href‘)
????ntitle?=?ehtml.xpath(‘//*[@id=“chenxing_menu“]/li/a/text()‘)
????urldata=[]
????for?i?in?range(1len(nurl)-1):
????????urldata.a
- 上一篇:《Python和Pygame游戲開發指南》隨書源碼
- 下一篇:python百度圖片
評論
共有 條評論