public class TokenizerFunction extends BaseTokenizerFunction implements org.apache.spark.api.java.function.Function<java.lang.String,Sequence<VocabWord>>
Fields inherited from class BaseTokenizerFunction: configurationBroadcast, tokenizerFactory, tokenPreprocessor
Constructor and Description |
---|
TokenizerFunction(org.apache.spark.broadcast.Broadcast<VectorsConfiguration> configurationBroadcast) |
Modifier and Type | Method and Description |
---|---|
Sequence<VocabWord> | call(java.lang.String s) |
Methods inherited from class BaseTokenizerFunction: instantiateTokenizerFactory
public TokenizerFunction(@NonNull org.apache.spark.broadcast.Broadcast<VectorsConfiguration> configurationBroadcast)