public class WordDocExtractor
extends WordExtractor
Modifier and Type | Field and Description |
---|---|
static float | TWIPS_PER_INCH |
static int | TWIPS_PER_PT |
Constructor and Description |
---|
WordDocExtractor(ParseContext context) |
Modifier and Type | Method and Description |
---|---|
static TagAndStyle | buildParagraphTagAndStyle(java.lang.String styleName, boolean isTable) |
protected void | parse(POIFSFileSystem filesystem, XHTMLContentHandler xhtml) |
protected void | parseWord6(POIFSFileSystem filesystem, XHTMLContentHandler xhtml) |
public static final float TWIPS_PER_INCH
public static final int TWIPS_PER_PT
protected void parse(POIFSFileSystem filesystem, XHTMLContentHandler xhtml) throws java.io.IOException, org.xml.sax.SAXException, TikaException
Throws:
- java.io.IOException
- org.xml.sax.SAXException
- TikaException
protected void parseWord6(POIFSFileSystem filesystem, XHTMLContentHandler xhtml) throws java.io.IOException, org.xml.sax.SAXException, TikaException
Throws:
- java.io.IOException
- org.xml.sax.SAXException
- TikaException
public static TagAndStyle buildParagraphTagAndStyle(java.lang.String styleName, boolean isTable)