当前位置:软件学习 > Word >>

使用 POI 读取 Word 文档

[java] 
package Java.se.lucene; 
 
import java.io.FileInputStream; 
import java.io.FileNotFoundException; 
import java.io.IOException; 
 
import org.apache.poi.hwpf.HWPFDocument;   
import org.apache.poi.hwpf.usermodel.Paragraph;   
import org.apache.poi.hwpf.usermodel.Range;   
 
public class WordToTxt { 
    // String buffer that accumulates the text read from the document.
    /*
     * Must not be declared as StringBuffer stringBuffer=null;
     * otherwise a NullPointerException is thrown when it is used.
     */ 
    StringBuffer stringBuffer=new StringBuffer(); 
     
    //转换word 
    public String readWord() 
    { 
        //word文档路径 
        String pathword="F:\\lucene\\doc\\1.doc"; 
        try { 
            //创建存储word文档的对象 
            HWPFDocument doc = new HWPFDocument(new FileInputStream(pathword)); 
            //用来获得word文档内容 
            Range range=doc.getRange(); 
            //文档段落数目 
            int paragraphCount=range.numParagraphs(); 
            //遍历段落读取数据 
            for(int i=0;i<paragraphCount;i++) 
            { 
                Paragraph pph=range.getParagraph(i); 
                stringBuffer.append(pph.text()); 
                System.out.println(stringBuffer.toString()); 
            } 
        } catch (FileNotFoundException e) { 
            e.printStackTrace(); 
        } catch (IOException e) { 
            e.printStackTrace(); 
        }  
        return stringBuffer.toString().trim(); 
    } 
   
    public static void main(String[] args) { 
        new WordToTxt().readWord(); 
    } 

 
 
补充:软件开发 , C++ ,
CopyRight © 2012 站长网 编程知识问答 www.zzzyk.com All Rights Reserved
部分技术文章来自网络,