import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.io.IOException;
import java.util.List;
import org.apache.poi.hwpf.HWPFDocument;
import org.apache.poi.hwpf.extractor.*;
import org.apache.poi.hwpf.model.*;
import org.apache.poi.hwpf.usermodel.CharacterRun;
import org.apache.poi.hwpf.usermodel.Picture;
import org.apache.poi.hwpf.usermodel.Range;
public class MsWordExtractor {
/**
* @param args
* @throws IOException
*/
public static void main(String[] args) throws IOException{
// The commented-out code below extracts all of the text from the document.
// FileInputStream in = new FileInputStream("D:/poiWord/rule.doc");
// WordExtractor extractor = new WordExtractor(in);
//
// String [] strArray = extractor.getParagraphText();
// String str = extractor.getText();
// for(int i = 0; i < strArray.length; +