public class NativeExtractor extends PartExtractor
Modifier and Type | Class and Description |
---|---|
static class |
NativeExtractor.Extractors |
PartExtractor.ExtractCtx, PartExtractor.ExtractCtxBase
log
condition
Constructor and Description |
---|
NativeExtractor() |
NativeExtractor(boolean annotateHTML,
boolean skipInvisibleHTMLText) |
NativeExtractor(boolean annotateHTML,
boolean skipInvisibleHTMLText,
boolean extractHTMLTables) |
NativeExtractor(boolean annotateHTML,
boolean skipInvisibleHTMLText,
boolean extractJs,
boolean extractHTMLTables,
boolean extractHTMLStyles,
boolean extractHTMLForms,
int maxHTMLAnnotationDepth)
Deprecated.
|
NativeExtractor(boolean annotateHTML,
boolean skipInvisibleHTMLText,
boolean extractHTMLTables,
int maxHTMLAnnotationDepth) |
NativeExtractor(boolean annotateHTML,
boolean skipInvisibleHTMLText,
NativeExtractor.Extractors extractors,
int maxHTMLAnnotationDepth) |
Modifier and Type | Method and Description |
---|---|
void |
convertToOctree(int maxDepth,
double cellPrec,
exa.io2.ByteBuffer b,
exa.io2.DynamicBuffer out) |
protected java.lang.String |
getDirective(PartExtractor.ExtractCtx ctx,
java.lang.String dirname,
java.lang.String defaultname) |
protected void |
handleBinaryNDoc(PartExtractor.ExtractCtx ctx) |
protected void |
handleHtml(PartExtractor.ExtractCtx ctx) |
protected void |
handleMatrix(PartExtractor.ExtractCtx ctx) |
protected void |
handleMesh(PartExtractor.ExtractCtx ctx) |
void |
handlePart(PartExtractor.ExtractCtx ctx) |
protected void |
handleText(PartExtractor.ExtractCtx ctx) |
protected void |
handleXMLNDoc(PartExtractor.ExtractCtx ctx) |
void |
process(DocumentProcessingContext context,
ProcessableDocument document)
Process a document.
|
void |
release()
Release all processor resources.
This method is called before processor finalization. |
canHandlePart, getDirective, partHasNoIndexDirective
getCondition, init, setCondition
public NativeExtractor(boolean annotateHTML, boolean skipInvisibleHTMLText)
public NativeExtractor(boolean annotateHTML, boolean skipInvisibleHTMLText, boolean extractHTMLTables)
public NativeExtractor(boolean annotateHTML, boolean skipInvisibleHTMLText, boolean extractHTMLTables, int maxHTMLAnnotationDepth)
@Deprecated public NativeExtractor(boolean annotateHTML, boolean skipInvisibleHTMLText, boolean extractJs, boolean extractHTMLTables, boolean extractHTMLStyles, boolean extractHTMLForms, int maxHTMLAnnotationDepth)
public NativeExtractor(boolean annotateHTML, boolean skipInvisibleHTMLText, NativeExtractor.Extractors extractors, int maxHTMLAnnotationDepth)
public NativeExtractor()
public void release()
DocumentProcessor
release
in interface DocumentProcessor
release
in class StandardDocumentProcessor
public void process(DocumentProcessingContext context, ProcessableDocument document)
DocumentProcessor
process
in interface DocumentProcessor
process
in class PartExtractor
context - Context to perform various operations related to processing
document - The document being processed.
public void handlePart(PartExtractor.ExtractCtx ctx)
handlePart
in class PartExtractor
protected void handleHtml(PartExtractor.ExtractCtx ctx)
protected void handleText(PartExtractor.ExtractCtx ctx)
protected java.lang.String getDirective(PartExtractor.ExtractCtx ctx, java.lang.String dirname, java.lang.String defaultname)
protected void handleMesh(PartExtractor.ExtractCtx ctx)
protected void handleMatrix(PartExtractor.ExtractCtx ctx)
protected void handleXMLNDoc(PartExtractor.ExtractCtx ctx)
protected void handleBinaryNDoc(PartExtractor.ExtractCtx ctx)
public void convertToOctree(int maxDepth, double cellPrec, exa.io2.ByteBuffer b, exa.io2.DynamicBuffer out)
Copyright © 2013 Dassault Systèmes, All Rights Reserved.