package cn.com.dao;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStream;
import org.textmining.text.extraction.WordExtractor;
public class ReadWord {
public String readWord(){
String str=null;
InputStream in =null;
try{
in = new FileInputStream ("F://word1.doc");
WordExtractor extractor = new WordExtractor();
str = extractor.extractText(in); //读取word文档的内容,放入string里
int leng = str.length(); //word文档的内容长度
int leng1 = str.trim().length(); //因为word文档存储的时候回存在回车等情况,所以需要取出空格
/*if(!(leng1==0)){ //判断word文档是否为空
System.out.println(str);//word文档的内容打印
}*/
}catch(Exception e){
e.printStackTrace();
}finally{
try {
in.close();
} catch (IOException e) {
e.printStackTrace();
}
}
return str.split("第一阶段")[0];
}
public String readWord(String path){
String str=null;
InputStream in =null;
try{
in = new FileInputStream (path);
WordExtractor extractor = new WordExtractor();
str = extractor.extractText(in); //读取word文档的内容,放入string里
int leng = str.length(); //word文档的内容长度
int leng1 = str.trim().length(); //因为word文档存储的时候回存在回车等情况,所以需要取出空格
/*if(!(leng1==0)){ //判断word文档是否为空
System.out.println(str);//word文档的内容打印
}*/
}catch(Exception e){
e.printStackTrace();
}finally{
try {
in.close();
} catch (IOException e) {
e.printStackTrace();
}
}
return str.split("第一阶段")[0];
}
}