For now, this only provides the method that reads the text content of a Word document.
Required jars:
poi-3.9-20121203.jar
poi-ooxml-3.9-20121203.jar
xmlbeans-2.3.0.jar
package com.word;

import java.io.File;
import java.io.FileInputStream;
import java.io.InputStream;
import java.util.Locale;

import org.apache.poi.POIXMLDocument;
import org.apache.poi.POIXMLTextExtractor;
import org.apache.poi.hwpf.extractor.WordExtractor;
import org.apache.poi.openxml4j.opc.OPCPackage;
import org.apache.poi.xwpf.extractor.XWPFWordExtractor;

/**
 * Utility for extracting the plain-text content of Microsoft Word documents
 * with Apache POI. Binary {@code .doc} files are read through
 * {@link WordExtractor}; OOXML {@code .docx} files are read through
 * {@link XWPFWordExtractor}.
 *
 * <p>NOTE(review): {@code WordExtractor} belongs to POI's HWPF module, which is
 * normally shipped in the separate poi-scratchpad jar - confirm that jar is on
 * the classpath before relying on {@code .doc} support.
 *
 * @author Qiaojiafei
 * @version created: February 22, 2016 11:30:04
 */
public class OptionWord {

    public static void main(String[] args) {
        // TODO Auto-generated method stub
    }

    /**
     * Reads the text of the Word document at {@code path}.
     *
     * <p>The format is chosen from the file extension, compared
     * case-insensitively: {@code .doc} or {@code .docx}. Any other path
     * (including {@code null}) is reported on standard output. This method is
     * best-effort: if the file cannot be opened or parsed, the stack trace is
     * printed and an empty buffer is returned instead of propagating the
     * exception.
     *
     * @param path file-system path of the Word document
     * @return a new buffer holding the extracted text; empty when the path is
     *         not a Word file or reading failed
     */
    public static StringBuffer readWord(String path) {
        String s = "";
        try {
            // Locale.ROOT keeps the comparison independent of the default locale
            // (e.g. the Turkish dotless i would otherwise break ".DOC").
            String lowerPath = (path == null) ? null : path.toLowerCase(Locale.ROOT);
            if (lowerPath != null && lowerPath.endsWith(".doc")) {
                InputStream is = new FileInputStream(new File(path));
                try {
                    WordExtractor ex = new WordExtractor(is);
                    s = ex.getText();
                } finally {
                    // The stream was previously leaked; always release the file handle.
                    is.close();
                }
            } else if (lowerPath != null && lowerPath.endsWith(".docx")) {
                OPCPackage opcPackage = POIXMLDocument.openPackage(path);
                try {
                    POIXMLTextExtractor extractor = new XWPFWordExtractor(opcPackage);
                    s = extractor.getText();
                } finally {
                    // revert() releases the package WITHOUT saving; close() could
                    // write the package back to disk, which a read must never do.
                    opcPackage.revert();
                }
            } else {
                System.out.println("The incoming Word file is incorrect:" + path);
            }
        } catch (Exception e) {
            // Deliberate best-effort: callers receive an empty buffer on failure.
            e.printStackTrace();
        }
        return new StringBuffer(s);
    }
}
Java reads Word content