Class TokenizerApplier
- java.lang.Object
-
- org.apache.sysds.runtime.transform.tokenize.applier.TokenizerApplier
-
- All Implemented Interfaces:
Serializable
- Direct Known Subclasses:
TokenizerApplierCount, TokenizerApplierHash, TokenizerApplierPosition
public abstract class TokenizerApplier extends Object implements Serializable
- See Also:
- Serialized Form
-
-
Field Summary
Fields Modifier and Type Field Description static String PADDING_STRING
-
Constructor Summary
Constructors Constructor Description TokenizerApplier(int numIdCols, int maxTokens, boolean wideFormat, boolean applyPadding)
-
Method Summary
All Methods Instance Methods Abstract Methods Concrete Methods Modifier and Type Method Description
void allocateInternalMeta(int numDocuments)
int applyInternalRepresentation(DocumentRepresentation[] internalRepresentation, FrameBlock out)
void build(DocumentRepresentation[] internalRepresentation, int inputRowStart, int blk)
List<DependencyTask<?>> getApplyTasks(DocumentRepresentation[] internalRepresentation, FrameBlock out)
List<DependencyTask<?>> getBuildTasks(DocumentRepresentation[] internalRepresentation)
int getMaxNumRows(int inRows)
int getMaxTokens()
long getNumCols()
abstract int getNumRows(DocumentRepresentation[] internalRepresentation)
<T,E> int getOutputRow(int inputRowStart, List<Map<T,E>> internalData)
int getOutputRow(int inputRowStart, DocumentRepresentation[] internalData)
abstract Types.ValueType[] getOutSchema()
boolean hasPadding()
boolean isWideFormat()
-
-
-
Field Detail
-
PADDING_STRING
public static final String PADDING_STRING
- See Also:
- Constant Field Values
-
-
Method Detail
-
applyInternalRepresentation
public int applyInternalRepresentation(DocumentRepresentation[] internalRepresentation, FrameBlock out)
-
build
public void build(DocumentRepresentation[] internalRepresentation, int inputRowStart, int blk)
-
getBuildTasks
public List<DependencyTask<?>> getBuildTasks(DocumentRepresentation[] internalRepresentation)
-
getApplyTasks
public List<DependencyTask<?>> getApplyTasks(DocumentRepresentation[] internalRepresentation, FrameBlock out)
-
getOutSchema
public abstract Types.ValueType[] getOutSchema()
-
hasPadding
public boolean hasPadding()
-
getMaxTokens
public int getMaxTokens()
-
getMaxNumRows
public int getMaxNumRows(int inRows)
-
getNumRows
public abstract int getNumRows(DocumentRepresentation[] internalRepresentation)
-
getOutputRow
public int getOutputRow(int inputRowStart, DocumentRepresentation[] internalData)
-
getNumCols
public long getNumCols()
-
isWideFormat
public boolean isWideFormat()
-
allocateInternalMeta
public void allocateInternalMeta(int numDocuments)
-
-