Class

com.salesforce.op.utils.text

LuceneRegexTextAnalyzer

Related Doc: package text

Permalink

class LuceneRegexTextAnalyzer extends LuceneTextAnalyzer

Text analyzer implementation using a Lucene analyzer with Pattern Tokenizer matching

Linear Supertypes

LuceneTextAnalyzer, TextAnalyzer, Serializable, Serializable, AnyRef, Any

Ordering

Alphabetic
By Inheritance

Inherited

LuceneRegexTextAnalyzer
LuceneTextAnalyzer
TextAnalyzer
Serializable
Serializable
AnyRef
Any

Hide All
Show All

Visibility

Public
All

Instance Constructors

new LuceneRegexTextAnalyzer(pattern: String, group: Int = -1)

pattern

is the regular expression

group

selects the matching group as the token (default: -1, which is equivalent to "split").

Value Members

final def !=(arg0: Any): Boolean

Definition Classes

AnyRef → Any
final def ##(): Int

Definition Classes

AnyRef → Any
final def ==(arg0: Any): Boolean

Definition Classes

AnyRef → Any
def analyze(s: String, language: Language): Seq[String]

Analyze a text and produce tokens

Analyze a text and produce tokens

s

input text

language

assumed text language

returns

sequence of tokens

Definition Classes

LuceneTextAnalyzer → TextAnalyzer
def analyzers(lang: Language): Analyzer

Lucene analyzer factory to use (defaults to LuceneTextAnalyzer)

Lucene analyzer factory to use (defaults to LuceneTextAnalyzer)

lang

desired language

returns

language-specific analyzer

Definition Classes

LuceneRegexTextAnalyzer → LuceneTextAnalyzer
final def asInstanceOf[T0]: T0

Definition Classes

Any
def clone(): AnyRef

Attributes

protected[java.lang]

Definition Classes

AnyRef

Annotations

@throws( ... )
final def eq(arg0: AnyRef): Boolean

Definition Classes

AnyRef
def equals(arg0: Any): Boolean

Definition Classes

AnyRef → Any
def finalize(): Unit

Attributes

protected[java.lang]

Definition Classes

AnyRef

Annotations

@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes

AnyRef → Any
val group: Int

selects the matching group as the token (default: -1, which is equivalent to "split").
def hashCode(): Int

Definition Classes

AnyRef → Any
final def isInstanceOf[T0]: Boolean

Definition Classes

Any
final def ne(arg0: AnyRef): Boolean

Definition Classes

AnyRef
final def notify(): Unit

Definition Classes

AnyRef
final def notifyAll(): Unit

Definition Classes

AnyRef
val pattern: String

is the regular expression
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes

AnyRef
def toString(): String

Definition Classes

AnyRef → Any
final def wait(): Unit

Definition Classes

AnyRef

Annotations

@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes

AnyRef

Annotations

@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes

AnyRef

Annotations

@throws( ... )

Inherited from LuceneTextAnalyzer

Inherited from TextAnalyzer

Inherited from Serializable

Inherited from Serializable

Inherited from AnyRef

Inherited from Any

Ungrouped