public class Tokenizer extends UnaryTransformer<java.lang.String,scala.collection.Seq<java.lang.String>,Tokenizer>
See Also: RegexTokenizer, Serialized Form
Constructor and Description |
---|
Tokenizer() |
Tokenizer(java.lang.String uid) |
Modifier and Type | Method and Description |
---|---|
Tokenizer |
copy(ParamMap extra)
Creates a copy of this instance with the same UID and some extra params.
|
protected scala.Function1<java.lang.String,scala.collection.Seq<java.lang.String>> |
createTransformFunc()
Creates the transform function using the given param map.
|
protected DataType |
outputDataType()
Returns the data type of the output column.
|
java.lang.String |
uid()
An immutable unique ID for the object and its derivatives.
|
protected void |
validateInputType(DataType inputType)
Validates the input type.
|
setInputCol, setOutputCol, transform, transformSchema
transform, transform, transform
transformSchema
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
initializeIfNecessary, initializeLogging, isTraceEnabled, log_, log, logDebug, logDebug, logError, logError, logInfo, logInfo, logName, logTrace, logTrace, logWarning, logWarning
clear, copyValues, defaultCopy, defaultParamMap, explainParam, explainParams, extractParamMap, extractParamMap, get, getDefault, getOrDefault, getParam, hasDefault, hasParam, isDefined, isSet, paramMap, params, set, set, set, setDefault, setDefault, shouldOwn, validateParams
toString
public java.lang.String uid()
Identifiable
protected scala.Function1<java.lang.String,scala.collection.Seq<java.lang.String>> createTransformFunc()
UnaryTransformer
createTransformFunc
in class UnaryTransformer<java.lang.String,scala.collection.Seq<java.lang.String>,Tokenizer>
protected void validateInputType(DataType inputType)
UnaryTransformer
validateInputType
in class UnaryTransformer<java.lang.String,scala.collection.Seq<java.lang.String>,Tokenizer>
inputType - (undocumented)
protected DataType outputDataType()
UnaryTransformer
outputDataType
in class UnaryTransformer<java.lang.String,scala.collection.Seq<java.lang.String>,Tokenizer>
public Tokenizer copy(ParamMap extra)
Params
copy
in interface Params
copy
in class UnaryTransformer<java.lang.String,scala.collection.Seq<java.lang.String>,Tokenizer>
extra - (undocumented)
See Also: defaultCopy()