91av视频/亚洲h视频/操亚洲美女/外国一级黄色毛片 - 国产三级三级三级三级

  • 大小:
    文件類型: .zip
    金幣: 2
    下載: 1 次
    發(fā)布日期: 2023-09-25
  • 語言: 其他
  • 標(biāo)簽: python??

資源簡介

資源截圖

代碼片段和文件信息

import?random
import?re
import?traceback

import?jieba
import?numpy?as?np
from?sklearn.externals?import?joblib
from?sklearn.naive_bayes?import?MultinomialNB

jieba.load_userdict(“train/word.txt“)
stop?=?[line.strip()?for?line?in?open(‘a(chǎn)d/stop.txt‘?‘r‘?encoding=‘utf-8‘).readlines()]??#?停用詞


def?build_key_word(path):??#?通過詞頻產(chǎn)生特征
????d?=?{}
????with?open(path?encoding=“utf-8“)?as?fp:
????????for?line?in?fp:
????????????for?word?in?jieba.cut(line.strip()):
????????????????p?=?re.compile(r‘\w‘?re.L)
????????????????result?=?p.sub(““?word)
????????????????if?not?result?or?result?==?‘?‘:??#?空字符
????????????????????continue
????????????????if?len(word)?>?1:??#?避免大量無意義的詞語進(jìn)入統(tǒng)計(jì)范圍
????????????????????d[word]?=?d.get(word?0)?+?1
????kw_list?=?sorted(d?key=lambda?x:?d[x]?reverse=True)
????size?=?int(len(kw_list)?*?0.2)??#?取最前的30%
????mood?=?set(kw_list[:size])
????return?list(mood?-?set(stop))


def?loadDataSet(path):??#?返回每條微博的分詞與標(biāo)簽
????line_cut?=?[]
????label?=?[]
????with?open(path?encoding=“utf-8“)?as?fp:
????????for?line?in?fp:
????????????temp?=?line.strip()
????????????try:
????????????????sentence?=?temp[2:].lstrip()??#?每條微博
????????????????label.append(int(temp[:2]))??#?獲取標(biāo)注
????????????????word_list?=?[]
????????????????sentence?=?str(sentence).replace(‘\u200b‘?‘‘)
????????????????for?word?in?jieba.cut(sentence.strip()):
????????????????????p?=?re.compile(r‘\w‘?re.L)
????????????????????result?=?p.sub(““?word)
????????????????????if?not?result?or?result?==?‘?‘:??#?空字符
????????????????????????continue
????????????????????word_list.append(word)
????????????????word_list?=?list(set(word_list)?-?set(stop)?-?set(‘\u200b‘)
?????????????????????????????????-?set(‘?‘)?-?set(‘\u3000‘)?-?set(‘?‘))
????????????????line_cut.append(word_list)
????????????except?Exception:
????????????????continue
????return?line_cut?label??#?返回每條微博的分詞和標(biāo)注


def?setOfWordsToVecTor(vocabularyList?moodWords):??#?每條微博向量化
????vocabMarked?=?[0]?*?len(vocabularyList)
????for?smsWord?in?moodWords:
????????if?smsWord?in?vocabularyList:
????????????vocabMarked[vocabularyList.index(smsWord)]?+=?1
????return?np.array(vocabMarked)


def?setOfWordsListToVecTor(vocabularyList?train_mood_array):??#?將所有微博準(zhǔn)備向量化
????vocabMarkedList?=?[]
????for?i?in?range(len(train_mood_array)):
????????vocabMarked?=?setOfWordsToVecTor(vocabularyList?train_mood_array[i])
????????vocabMarkedList.append(vocabMarked)
????return?vocabMarkedList


def?trainingNaiveBayes(train_mood_array?label):??#?計(jì)算先驗(yàn)概率
????numTrainDoc?=?len(train_mood_array)
????numWords?=?len(train_mood_array[0])
????prior_Pos?prior_Neg?prior_Neutral?=?0.0?0.0?0.0
????for?i?in?label:
????????if?i?==?1:
????????????prior_Pos?=?prior_Pos?+?1
????????elif?i?==?2:
????????????prior_Neg?=?prior_Neg?+?1
????????else:
????????????prior_Neutral?=?prior_Neutral?+?1
????prior_Pos?=?prior_Pos?/?float(numTrainDoc)
????prior_Neg?=?prior_Neg?/?float(numTrainDoc)
????prior_Neutral?=?prior_Neutral?/?float(numTrainDoc)
????wordsInPosNum?=?np.ones

?屬性????????????大小?????日期????時(shí)間???名稱
-----------?---------??----------?-----??----
?????目錄???????????0??2017-12-17?09:54??weiboanalysis-master\
?????文件????????6977??2017-12-17?09:54??weiboanalysis-master\Bayes.py
?????文件???????11357??2017-12-17?09:54??weiboanalysis-master\LICENSE
?????文件????????1765??2017-12-17?09:54??weiboanalysis-master\README.md
?????文件????????3357??2017-12-17?09:54??weiboanalysis-master\SVM.py
?????目錄???????????0??2017-12-17?09:54??weiboanalysis-master\ad\
?????文件???????45522??2017-12-17?09:54??weiboanalysis-master\ad\advertise.txt
?????文件???????66038??2017-12-17?09:54??weiboanalysis-master\ad\normal.txt
?????文件???????13407??2017-12-17?09:54??weiboanalysis-master\ad\stop.txt
?????文件??????????79??2017-12-17?09:54??weiboanalysis-master\ad\train.txt
?????目錄???????????0??2017-12-17?09:54??weiboanalysis-master\doc\
?????文件?????1295601??2017-12-17?09:54??weiboanalysis-master\doc\基于AdaBoost算法的情感分析研究.docx
?????文件????????2385??2017-12-17?09:54??weiboanalysis-master\draw_pic.py
?????文件?????????347??2017-12-17?09:54??weiboanalysis-master\from_database.py
?????文件?????????749??2017-12-17?09:54??weiboanalysis-master\jiebatest.py
?????目錄???????????0??2017-12-17?09:54??weiboanalysis-master\model\
?????文件?????????539??2017-12-17?09:54??weiboanalysis-master\model\gnb.model
?????文件??????????92??2017-12-17?09:54??weiboanalysis-master\model\gnb.model_01.npy
?????文件?????????104??2017-12-17?09:54??weiboanalysis-master\model\gnb.model_02.npy
?????文件????????7352??2017-12-17?09:54??weiboanalysis-master\model\gnb.model_03.npy
?????文件?????????104??2017-12-17?09:54??weiboanalysis-master\model\gnb.model_04.npy
?????文件????????7352??2017-12-17?09:54??weiboanalysis-master\model\gnb.model_05.npy
?????目錄???????????0??2017-12-17?09:54??weiboanalysis-master\multi_AdaBoost\
?????文件????????7951??2017-12-17?09:54??weiboanalysis-master\multi_AdaBoost\Bayes.py
?????目錄???????????0??2017-12-17?09:54??weiboanalysis-master\multi_AdaBoost\model\
?????文件???????15554??2017-12-17?09:54??weiboanalysis-master\multi_AdaBoost\model\gnb.model
?????文件????????2635??2017-12-17?09:54??weiboanalysis-master\multi_AdaBoost\multi_boost.py
?????文件????????4171??2017-12-17?09:54??weiboanalysis-master\multi_AdaBoost\multi_test.py
?????目錄???????????0??2017-12-17?09:54??weiboanalysis-master\ntusd\
?????文件???????80818??2017-12-17?09:54??weiboanalysis-master\ntusd\ntusd-negative.txt
?????文件???????26508??2017-12-17?09:54??weiboanalysis-master\ntusd\ntusd-positive.txt
............此處省略54個(gè)文件信息

評論

共有 條評論