📄 docextractor.java
字号:
package invertedList;
import java.io.BufferedInputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.FileNotFoundException;
import java.io.IOException;
import org.apache.poi.hwpf.extractor.WordExtractor;
/**
 * Extracts the text content of a Word {@code .doc} file.
 *
 * @author Administrator
 */
public class DocExtractor extends Extractor {

    /**
     * Returns the text content of the given doc file.
     *
     * <p>The file is opened through a buffered stream and handed to POI's
     * {@link WordExtractor}. The stream is closed on every exit path,
     * including when constructing the extractor or reading the text fails.
     *
     * @param file the doc file to read
     * @return the extracted text, or {@code null} if the file cannot be
     *         opened or an I/O error occurs while reading it
     * @see invertedList.Extractor#getInformation(java.io.File)
     */
    @Override
    public String getInformation(File file) {
        // try-with-resources guarantees the stream is closed even when
        // WordExtractor throws, which the previous explicit close() did not.
        try (BufferedInputStream is = new BufferedInputStream(new FileInputStream(file))) {
            WordExtractor extractor = new WordExtractor(is);
            return extractor.getText();
        } catch (IOException e) {
            // FileNotFoundException is a subclass of IOException, so a
            // missing or unreadable file is reported here as well.
            e.printStackTrace();
            return null;
        }
    }
}
⌨️ 快捷键说明
复制代码
Ctrl + C
搜索代码
Ctrl + F
全屏模式
F11
切换主题
Ctrl + Shift + D
显示快捷键
?
增大字号
Ctrl + =
减小字号
Ctrl + -