HebrewTokenizer

Tokenizes a given stream using HebMorph's Tokenizer and, where possible, removes prefixes and tags Tokens with appropriate types.

Constructors

Link copied to clipboard
constructor(prefixes: MutableMap<String, Int>)
constructor(_prefixesTree: MutableMap<String, Int>, specialCases: DictRadix<Byte>?)

Types

Link copied to clipboard
object Companion
Link copied to clipboard
interface TOKEN_TYPES

Properties

Functions

Link copied to clipboard
fun <T : Attribute> addAttribute(attClass: KClass<T>): T
Link copied to clipboard
Link copied to clipboard
Link copied to clipboard
Link copied to clipboard
Link copied to clipboard
open override fun close()
Link copied to clipboard
fun copyTo(target: AttributeSource)
Link copied to clipboard
open override fun end()
Link copied to clipboard
Link copied to clipboard
open operator override fun equals(obj: Any?): Boolean
Link copied to clipboard
fun <T : Attribute> getAttribute(attClass: KClass<T>): T?
Link copied to clipboard
fun hasAttribute(attClass: KClass<out Attribute>): Boolean
Link copied to clipboard
Link copied to clipboard
open override fun hashCode(): Int
Link copied to clipboard
open override fun incrementToken(): Boolean
Link copied to clipboard
Link copied to clipboard
fun reflectAsString(prependAttClass: Boolean): String
Link copied to clipboard
Link copied to clipboard
Link copied to clipboard
open override fun reset()
Link copied to clipboard
Link copied to clipboard
fun setReader(input: Reader)
Link copied to clipboard
fun setSuffixForExactMatch(suffixForExactMatch: Char?)
Link copied to clipboard
open override fun toString(): String
Link copied to clipboard