資源簡介
poi將word里面的內容轉換成html、包括word里面字體的大小、表格的處理、還有圖片、段落等等...

代碼片段和文件信息
package?net.sunflower.demo;
import?java.io.BufferedWriter;??
import?java.io.File;??
import?java.io.FileInputStream;??
import?java.io.FileNotFoundException;??
import?java.io.FileOutputStream;??
import?java.io.IOException;??
import?java.io.OutputStream;??
import?java.io.OutputStreamWriter;??
??
import?org.apache.poi.hwpf.HWPFDocument;??
import?org.apache.poi.hwpf.model.PicturesTable;??
import?org.apache.poi.hwpf.usermodel.CharacterRun;??
import?org.apache.poi.hwpf.usermodel.Picture;??
import?org.apache.poi.hwpf.usermodel.Range;??
import?org.apache.poi.hwpf.usermodel.Paragraph;?????
import?org.apache.poi.hwpf.usermodel.Table;?????
import?org.apache.poi.hwpf.usermodel.TableCell;?????
import?org.apache.poi.hwpf.usermodel.TableIterator;?????
import?org.apache.poi.hwpf.usermodel.TableRow;?????
??
??
public?class?WordtoHtml?{??
??
????/**?
?????*?回車(chē)符ASCII碼?
?????*/??
????private?static?final?short?ENTER_ASCII?=?13;??
??
????/**?
?????*?空格符ASCII碼?
?????*/??
????private?static?final?short?SPACE_ASCII?=?32;??
??
????/**?
?????*?水平制表符ASCII碼?
?????*/??
????private?static?final?short?TABULATION_ASCII?=?9;??
??
????public?static?String?htmlText?=?““;??
????public?static?String?htmlTextTbl?=?““;??
????public?static?int?counter=0;??
????public?static?int?beginPosi=0;??
????public?static?int?endPosi=0;??
????public?static?int?beginArray[];??
????public?static?int?endArray[];??
????public?static?String?htmlTextArray[];??
????public?static?boolean?tblExist=false;??
??????
????public?static?void?main(String?argv[])??
????{?????????
????????try?{??
???????? getWordAndstyle(“D://kexie/讀取科協(xié).doc“);
????????}?catch?(Exception?e)?{??
????????????e.printStackTrace();??
????????}??
????}??
??????
????/**?
?????*?讀取每個(gè)文字樣式?
?????*??
?????*?@param?fileName?
?????*?@throws?Exception?
?????*/??
??
??????
????public?static?void?getWordAndstyle(String?fileName)?throws?Exception?{??
????????FileInputStream?in?=?new?FileInputStream(new?File(fileName));??
????????HWPFDocument?doc?=?new?HWPFDocument(in);??
??????????
?????????Range?rangetbl?=?doc.getRange();//得到文檔的讀取范圍?????
?????????TableIterator?it?=?new?TableIterator(rangetbl);???
?????????int?num=100;??????????
??????????
???????????
?????????beginArray=new?int[num];??
?????????endArray=new?int[num];??
?????????htmlTextArray=new?String[num];??
????????//?取得文檔中字符的總數(shù)??
????????int?length?=?doc.characterLength();??
????????//?創(chuàng)建圖片容器??
????????PicturesTable?pTable?=?doc.getPicturesTable();??
??????????
????????htmlText?=?“tle>“?+?doc.getSummaryInformation().gettitle()?+?“ tle>“;??
????????//?創(chuàng)建臨時(shí)字符串好加以判斷一串字符是否存在相同格式??
??????????
?????????if(it.hasNext())??
?????????{??
?????????????readTable(itrangetbl);??
?????????}??
???????????
?????????int?cur=0;??
??????????????
????????String?tempString?=?““;??
????????for?(int?i?=?0;?i?????????????//?整篇文章的字符通過(guò)一個(gè)個(gè)字符的來(lái)判斷range為得到文檔的范圍??
????????????
 屬性            大小     日期    時間   名稱
----------- ---------  ---------- -----  ----
     文件    1760031  2011-10-25 20:19  poi將word轉換成html\poi-3.8-beta4-20110826.jar
     文件    1129968  2011-10-25 20:19  poi將word轉換成html\poi-scratchpad-3.8-beta4-20110826.jar
     文件      10342  2013-03-04 10:19  poi將word轉換成html\WordtoHtml.java
     目錄          0  2013-03-04 10:21  poi將word轉換成html
----------- ---------  ---------- -----  ----
              2900341                    4
評論
共有 條評論