91av视频/亚洲h视频/操亚洲美女/外国一级黄色毛片 - 国产三级三级三级三级

  • 大小: 7KB
    文件類型: .zip
    金幣: 2
    下載: 0 次
    發布日期: 2021-05-28
  • 語言: 其他
  • 標簽: svm, lda, 文本分類

資源簡介

簡易有效的文本分類

資源截圖

代碼片段和文件信息

import sys

from sklearn import metrics, svm
from sklearn.datasets import load_svmlight_file

# Return precision, recall, F1 and accuracy.
def getScores(true_classes, pred_classes, average):
    """Compute precision, recall, F1 and accuracy for a set of predictions.

    Args:
        true_classes: Ground-truth class labels.
        pred_classes: Predicted class labels, aligned with ``true_classes``.
        average: Averaging mode forwarded unchanged to the precision, recall
            and F1 scorers (the caller in this file passes 'micro' and
            'macro').

    Returns:
        A ``(precision, recall, f1, accuracy)`` tuple. Accuracy is computed
        without the ``average`` argument.
    """
    precision = metrics.precision_score(true_classes, pred_classes, average=average)
    recall = metrics.recall_score(true_classes, pred_classes, average=average)
    f1 = metrics.f1_score(true_classes, pred_classes, average=average)
    accuracy = metrics.accuracy_score(true_classes, pred_classes)
    return precision, recall, f1, accuracy

# Command line: python classEval.py corpus filetype [first-last]
#   corpus    -- '20news' selects the 20news-* files; any other value
#                selects the reuters-* files.
#   filetype  -- feature-type tag substituted into the file names
#                (e.g. lda, bow).
#   first-last (optional) -- use only a subset of the feature dimensions,
#                given as a 1-based inclusive range such as 1-400.
if len(sys.argv) < 3:
    # Fail with a readable message instead of an IndexError on sys.argv.
    sys.exit("Usage: python classEval.py corpus filetype [first-last]")

corpus = sys.argv[1]
filetype = sys.argv[2]

if len(sys.argv) > 3:
    bounds = sys.argv[3].split("-")
    # Convert the 1-based inclusive range into a 0-based half-open slice.
    dims = [int(bounds[0]) - 1, int(bounds[1])]
else:
    dims = None

# Build the training and test file names from the per-corpus templates.
if corpus == '20news':
    train_file = "20news-train-11314.svm-%s.txt" % filetype
    test_file = "20news-test-7532.svm-%s.txt" % filetype
else:
    train_file = "reuters-train-5770.svm-%s.txt" % filetype
    test_file = "reuters-test-2255.svm-%s.txt" % filetype

# Load the features and labels of the training and test files.
train_features_sparse, true_train_classes = load_svmlight_file(train_file)
# The column count is otherwise inferred per file from the highest feature
# index present, so force the test matrix to the training width; a width
# mismatch would make model.predict() fail later.
test_features_sparse, true_test_classes = load_svmlight_file(
    test_file, n_features=train_features_sparse.shape[1])

# The loader returns sparse matrices; convert them to dense numpy arrays.
train_features = train_features_sparse.toarray()
test_features = test_features_sparse.toarray()

# print(...) with one argument behaves the same under Python 2 and 3.
print("Train: %dx%d. Test: %dx%d" % (train_features.shape + test_features.shape))

if dims is not None:
    # Keep every row, but only the requested feature columns.
    train_features = train_features[:, dims[0]:dims[1]]
    test_features = test_features[:, dims[0]:dims[1]]
    print("Choose only features %d-%d" % (dims[0] + 1, dims[1]))

# Linear SVM with L1 regularisation.
model = svm.LinearSVC(penalty='l1', dual=False)

# Train on the training file.
print("Training...")
model.fit(train_features, true_train_classes)
print("Done.")

# Predict on both the training and the test features.
pred_train_classes = model.predict(train_features)
pred_test_classes = model.predict(test_features)

# Report the results.
print(metrics.classification_report(true_train_classes, pred_train_classes, digits=3))
print(metrics.classification_report(true_test_classes, pred_test_classes, digits=3))

for average in ['micro', 'macro']:
    train_precision, train_recall, train_f1, train_acc = getScores(
        true_train_classes, pred_train_classes, average)
    print("Train Prec (%s average): %.3f recall: %.3f F1: %.3f Acc: %.3f" % (
        average, train_precision, train_recall, train_f1, train_acc))

    test_precision, test_recall, test_f1, test_acc = getScores(
        true_test_classes, pred_test_classes, average)
    print("Test Prec (%s average): %.3f recall: %.3f F1: %.3f Acc: %.3f" % (
        average, test_precision, test_recall, test_f1, test_acc))

 屬性            大小     日期    時間   名稱
----------- ---------  ---------- -----  ----
     目錄           0  2017-02-27 17:39  lda_classifier\
     文件        3055  2017-02-27 17:39  lda_classifier\classEval.py
     文件        7381  2017-02-27 17:39  lda_classifier\corpusLoader.py
     文件        4563  2017-02-27 17:39  lda_classifier\ldaExp.py
     文件         795  2017-02-27 17:39  lda_classifier\README.md

評論

共有 條評論