91av视频/亚洲h视频/操亚洲美女/外国一级黄色毛片 - 国产三级三级三级三级

資源簡介

DF 算法:通過在訓練集中提取詞語,比較各詞語的出現次數,進行特征詞的提取。這個代碼提取兩個類的特征詞;可修改 main 函數(直接刪除其中一部分即可,代碼有詳細注釋),只提取一個類的特征。此程序編譯過,無錯。

資源截圖

代碼片段和文件信息

package?df;

import?java.io.BufferedReader;
import?java.io.BufferedWriter;
import?java.io.File;
import?java.io.FileInputStream;
import?java.io.FileNotFoundException;
import?java.io.FileOutputStream;
import?java.io.InputStreamReader;
import?java.io.OutputStreamWriter;
import?java.nio.CharBuffer;

public?class?dfb?{


public?static?void?main(String[]?args)?{
String[]?temp?=?new?String[1024];//所有詞語(yǔ)存的數(shù)組
int?[]?w?;?//用來記錄每個(gè)詞的權(quán)重
int?k=100;?//取權(quán)重最高的前K個(gè)feature
String?termWeighFile=“termWeigh.txt“;??//用于保存全部《特征?,權(quán)重》對(duì)
String?topFeatureFile=“Feature.txt“;??//保存前k個(gè)《特征?,權(quán)重》對(duì)
String?termnonum=“Featrueno.txt“;//保存《特征》
String?dirName=“D:\\2013fall\\數(shù)字內(nèi)容安全實(shí)驗(yàn)\\3\\訓(xùn)練集\\汽車\\“;??//存放所有語(yǔ)料集的目錄地址,如C://
//初始化w
????w=new?int[1024];

????//把語(yǔ)料集全部列出來
File?dir?=?new?File(dirName);??
File[]?files?=?dir.listFiles();?
//總結(jié)所有詞匯
remwords(fileswtemp);
//刪除干擾詞
for(int?a=0;a if(IsStopWord(temp[a])){
delet(?tempa?w);

}
}

//輸出《特征,權(quán)重》對(duì)
try?{
FileOutputStream?fos?=?new?FileOutputStream(termWeighFile);
OutputStreamWriter?osw?=?new?OutputStreamWriter(fos);
BufferedWriter?bw?=?new?BufferedWriter(osw);
for(int?i=0;i bw.write(temp[i]+“??“);
bw.write(String.valueOf(w[i]));
bw.newLine();
}
bw.close();
osw.close();
fos.close();
}?catch?(Exception?e)?{
System.out.println(e.getMessage());
}?

//選出特征詞
top_feature(tempw);
//輸出權(quán)重在前面的特征及權(quán)重
try?{
FileOutputStream?fos?=?new?FileOutputStream(topFeatureFile);
OutputStreamWriter?osw?=?new?OutputStreamWriter(fos);
BufferedWriter?bw?=?new?BufferedWriter(osw);
for(int?i=0;i bw.write(temp[i]+“??“);
bw.write(String.valueOf(w[i]));
bw.newLine();
}
bw.close();
osw.close();
fos.close();
}?catch?(Exception?e)?{
System.out.println(e.getMessage());
}?
try?{
FileOutputStream?fos?=?new?FileOutputStream(termnonum);
OutputStreamWriter?osw?=?new?OutputStreamWriter(fos);
BufferedWriter?bw?=?new?BufferedWriter(osw);
for(int?i=0;i bw.write(temp[i]);
bw.newLine();
}
bw.close();
osw.close();
fos.close();
}?catch?(Exception?e)?{
System.out.println(e.getMessage());
}?

?String[]?temp2?=?new?String[1024];//所有詞語(yǔ)存的數(shù)組
int?[]?w2?;?//用來記錄每個(gè)詞的權(quán)重
int?k2=100;?//取權(quán)重最高的前K個(gè)feature
String?termWeighFile2=“termWeigh2.txt“;??//用于保存全部《特征?,權(quán)重》對(duì)
String?topFeatureFile2=“Feature2.txt“;??//保存前k個(gè)《特征?,權(quán)重》對(duì)
String?termnonum2=“Featrueno2.txt“;//保存《特征》
String?dirName2=“D:\\2013fall\\數(shù)字內(nèi)容安全實(shí)驗(yàn)\\3\\訓(xùn)練集\\軍事\\“;??//存放所有語(yǔ)料集的目錄地址,如C://
//初始化w
????w2=new?int[1024];

????//把語(yǔ)料集全部列出來
File?dir2?=?new?File(dirName2);??
File[]?files2?=?dir2.listFiles();?
//總結(jié)所有詞匯
remwords(files2w2temp2);
//刪除干擾詞
for(int?a=0;a if(IsStopWord(temp2[a])){
delet(?temp2a?w2);

}
}

//輸出《特征,權(quán)重》對(duì)
try?{
File

 屬性            大小     日期    時間   名稱
----------- ---------  ---------- -----  ----
     目錄           0  2013-11-24 22:12  df\
     文件         301  2013-11-20 17:22  df\.classpath
     文件         378  2013-11-20 17:22  df\.project
     目錄           0  2013-11-20 17:22  df\.settings\
     文件         598  2013-11-20 17:22  df\.settings\org.eclipse.jdt.core.prefs
     目錄           0  2013-11-20 17:22  df\bin\
     目錄           0  2013-11-24 22:19  df\bin\df\
     文件        8126  2013-11-24 22:17  df\bin\df\dfb.class
     文件         501  2013-11-24 22:17  df\Featrueno.txt
     文件         659  2013-11-24 22:17  df\Featrueno2.txt
     文件        1034  2013-11-24 22:17  df\Feature.txt
     文件        1192  2013-11-24 22:17  df\Feature2.txt
     目錄           0  2013-11-20 17:22  df\src\
     目錄           0  2013-11-21 18:21  df\src\df\
     文件        7605  2013-11-24 22:17  df\src\df\dfb.java
     文件       10143  2013-11-24 22:17  df\termWeigh.txt
     文件       11368  2013-11-24 22:17  df\termWeigh2.txt

評論

共有 條評論