List of usage examples for org.apache.poi.xwpf.usermodel.XWPFRelation.DOCUMENT
XWPFRelation DOCUMENT
To view the source code for org.apache.poi.xwpf.usermodel.XWPFRelation.DOCUMENT, click the Source Link.
From source file:org.apache.tika.parser.microsoft.ooxml.xwpf.ml2006.Word2006MLDocHandler.java
License:Apache License
/**
 * Creates the document handler and registers one part handler per package part
 * content type it processes, then sets up the binary data handler.
 *
 * @param xhtml    content handler handed to every text part handler and to the
 *                 binary data handler
 * @param metadata metadata object handed to the core/extended properties handlers
 *                 and to the binary data handler
 * @param context  parse context; the {@code OfficeParserConfig} is looked up from it
 *                 and passed on as-is
 */
public Word2006MLDocHandler(XHTMLContentHandler xhtml, Metadata metadata, ParseContext context) {
    this.xhtml = xhtml;
    this.metadata = metadata;
    this.parseContext = context;

    OfficeParserConfig config = context.get(OfficeParserConfig.class);

    // The relationships handler is registered before any text part handler.
    addPartHandler(new RelationshipsHandler(relationshipsManager));

    // Text-bearing parts, listed in registration order.
    // NOTE(review): XWPFRelation.FOOTNOTE presumably resolves to the same
    // footnotes content type that also appears as a literal further down;
    // confirm whether the double registration is intentional.
    String[] textPartContentTypes = {
        XWPFRelation.DOCUMENT.getContentType(),
        XWPFRelation.FOOTNOTE.getContentType(),
        "application/vnd.openxmlformats-officedocument.wordprocessingml.endnotes+xml",
        XWPFRelation.HEADER.getContentType(),
        XWPFRelation.FOOTER.getContentType(),
        "application/vnd.openxmlformats-officedocument.wordprocessingml.comments+xml",
        "application/vnd.openxmlformats-officedocument.wordprocessingml.footnotes+xml",
        "application/vnd.openxmlformats-officedocument.wordprocessingml.document.glossary+xml"
    };
    for (String contentType : textPartContentTypes) {
        addPartHandler(new WordAndPowerPointTextPartHandler(contentType, xhtml,
                relationshipsManager, config));
    }

    // Property parts feed the metadata object rather than the XHTML output handler.
    addPartHandler(new CorePropertiesHandler(metadata));
    addPartHandler(new ExtendedPropertiesHandler(metadata));

    binaryDataHandler = new BinaryDataHandler(xhtml, metadata, context);
}
From source file:org.apache.tika.parser.microsoft.ooxml.xwpf.Word2006MLHandler.java
License:Apache License
public Word2006MLHandler(XHTMLContentHandler handler, Metadata metadata, ParseContext context) { this.handler = handler; this.metadata = metadata; this.parseContext = context; addPackageHandler(new RelationshipsHandler(relationshipsManager)); addPackageHandler(new BodyContentHandler(XWPFRelation.DOCUMENT.getContentType(), relationshipsManager, handler, metadata, context)); addPackageHandler(new BodyContentHandler(XWPFRelation.FOOTNOTE.getContentType(), relationshipsManager, handler, metadata, context)); addPackageHandler(new BodyContentHandler( "application/vnd.openxmlformats-officedocument.wordprocessingml.endnotes+xml", relationshipsManager, handler, metadata, context)); addPackageHandler(new BodyContentHandler(XWPFRelation.HEADER.getContentType(), relationshipsManager, handler, metadata, context)); addPackageHandler(new BodyContentHandler(XWPFRelation.FOOTER.getContentType(), relationshipsManager, handler, metadata, context)); addPackageHandler(new BodyContentHandler( "application/vnd.openxmlformats-officedocument.wordprocessingml.comments+xml", relationshipsManager, handler, metadata, context)); addPackageHandler(new BodyContentHandler( "application/vnd.openxmlformats-officedocument.wordprocessingml.document.glossary+xml", relationshipsManager, handler, metadata, context)); addPackageHandler(new BodyContentHandler( "application/vnd.openxmlformats-officedocument.wordprocessingml.footnotes+xml", relationshipsManager, handler, metadata, context)); addPackageHandler(new CorePropertiesHandler(metadata)); addPackageHandler(new ExtendedPropertiesHandler(metadata)); binaryDataHandler = new BinaryDataHandler(handler, metadata, context); }
From source file:org.apache.tika.parser.microsoft.ooxml.xwpf.XWPFEventBasedWordExtractor.java
License:Apache License
@Override public String getText() { StringBuilder sb = new StringBuilder(); //handle main document List<PackagePart> pps = container.getPartsByContentType(XWPFRelation.DOCUMENT.getContentType()); if (pps != null) { for (PackagePart pp : pps) { //likely only one, but why not... try { handleDocumentPart(pp, sb); } catch (IOException e) { e.printStackTrace();// w w w . j a v a2 s. co m } catch (SAXException e) { e.printStackTrace(); } } } //handle glossary document pps = container.getPartsByContentType(XWPFRelation.GLOSSARY_DOCUMENT.getContentType()); if (pps != null) { for (PackagePart pp : pps) { //likely only one, but why not... try { handleDocumentPart(pp, sb); } catch (IOException e) { e.printStackTrace(); } catch (SAXException e) { e.printStackTrace(); } } } return sb.toString(); }