91av视频/亚洲h视频/操亚洲美女/外国一级黄色毛片 - 国产三级三级三级三级

  • 大小: 2.71MB
    文件類型: .zip
    金幣: 2
    下載: 1 次
    發布日期: 2021-04-09
  • 語言: Python
  • 標簽: python 爬蟲

資源簡介

python爬蟲,并將數據進行可視化分析;數據可視化包含餅圖、柱狀圖、漏斗圖、詞云,另附源代碼和報告書。

資源截圖

代碼片段和文件信息

import tkinter as tk
import time
from tkinter import *
from tkinter import messagebox
import string
import pickle
import random
import requests
from bs4 import BeautifulSoup
import os
import jieba
from pyecharts.charts import Bar
from pyecharts.charts import Pie
from pyecharts.charts import Funnel
from pyecharts.charts import Page, WordCloud
from pyecharts import options as opts
from pyecharts.globals import SymbolType
from pyecharts.globals import ThemeType
# HTTP request headers passed to requests.get() for every search-page fetch.
# They imitate a desktop Chrome browser; 'Host' pins the Dangdang search host.
headers = {
    'Upgrade-Insecure-Requests': '1',
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/72.0.3626.119 Safari/537.36',
    'Accept-Encoding': 'gzip, deflate',
    # Comma-separated language ranges with q-weights.
    'Accept-Language': 'zh-CN,zh;q=0.9,en;q=0.8',
    'Cache-Control': 'no-cache',
    'Connection': 'keep-alive',
    'Host': 'search.dangdang.com',
}
def parseHtml(html):
    """Extract book records from one search-result page.

    Args:
        html: Markup of a search-result page, as text.

    Returns:
        dict: Maps each book title to the list
        ``[img_src, price, detail, stars, num_comments]``. Empty when the
        page contains no ``<div class="con shoplist">`` container.

    Raises:
        IndexError, AttributeError, ValueError: If a listed item lacks one
            of the expected elements, or its price, rating width or comment
            count is not numeric.
    """
    data = {}
    soup = BeautifulSoup(html, 'lxml')
    containers = soup.find_all('div', {'class': 'con shoplist'})
    if not containers:
        # No result list on this page: report "no books" rather than
        # failing with IndexError on the [0] lookup.
        return data

    for each in containers[0].find_all('li'):
        # The first link of the item carries both the title and the cover.
        first_link = each.find_all('a')[0]
        # Book title
        bookname = first_link.get('title').strip(' ')
        # Cover image: prefer 'data-original', fall back to 'src'.
        img_src = first_link.img.get('data-original')
        if img_src is None:
            img_src = first_link.img.get('src')
        img_src = img_src.strip(' ')
        # Price: the first character of the text is skipped
        # (presumably a currency sign -- confirm against the live page).
        price = float(each.find_all('p', {'class': 'price'})[0].span.text[1:])
        # Description
        detail = each.find_all('p', {'class': 'detail'})[0].text
        star_line = each.find_all('p', {'class': 'search_star_line'})[0]
        # Rating: the inner span's style ends in a percentage, e.g. "...: 90%;";
        # dividing by 20 maps 0-100 onto 0-5.
        percent = star_line.span.span.get('style').split(': ')[-1].strip('%;')
        stars = float(percent) / 20
        # Comment count: the last three characters of the link text are dropped
        # (presumably a unit suffix -- confirm against the live page).
        num_comments = float(star_line.a.text[:-3])
        data[bookname] = [img_src, price, detail, stars, num_comments]
    return data
def?create():
????global?keyword
????global?num_page
????keyword?=?text_var.get()
????top?=?Toplevel()
????top.title(‘Python‘)
????#top.geometry(‘850x150‘)
????img1?=?tk.PhotoImage(file=“bg.gif“)
????v?=?tk.StringVar()
????label_1?=?tk.Label(top?textvariable=v?fg=“red“?bg=“black“?font=(“黑體“?20))
????label_1.pack()

????url?=?‘http://search.dangdang.com/?key={}&act=input&page_index={}‘
????results?=?{}
????cnt?=?0
????num_page?=?0
????while?True:
????????cnt?+=?1
????????if?cnt?>?5:
????????????break
????????num_page?+=?1
????????v.set(‘[INFO]:?Start?to?get?the?data?of?page%d...‘?%?num_page)
????????label_1.update()
????????time.sleep(3)
????????page_url??=?url.format(keyword?num_page)
????????res?=?requests.get(page_url?headers=headers)
????????if?‘抱歉,沒有找到與“%s”相關的商品,建議適當減少篩選條件‘?%?keyword?in?res.text:
????????????break
????????page_data?=?parseHtml(res.text)
????????results.update(page_data)
????????

????messagebox.showinfo(?“Python爬蟲“?“爬蟲已完成“)
????with?open(‘%s_%d.pkl‘?%?(keyword?num_page-1)?‘wb‘)?as?f:
????????pickle.dump(results?f)

????labe

 屬性            大小     日期    時間   名稱
----------- ---------  ---------- -----  ----
     文件        9723  2020-06-12 15:28  python代碼\Reptile+Pyecharts.py
     文件      270140  2019-12-29 21:00  python代碼\bg.gif
     文件       96863  2019-12-30 15:07  python代碼\nyist.gif
     文件     2476375  2020-06-12 15:35  python代碼\python數據可視化分析大作業.docx
     文件       20270  2019-12-22 18:17  python代碼\stopwords.txt
     目錄           0  2020-06-12 15:35  python代碼\

評論

共有 條評論