nlp

Type Members

trait AttrCubbieSlots extends util.Cubbie
class BasicSection extends Section

A simple concrete implementation of Section.
trait DateAttrCubbieSlot extends util.Cubbie with AttrCubbieSlots
class Document extends DocumentSubstring with Attr

A Document holds a String containing the original raw string contents of a natural language document to be processed.
class DocumentAnnotationPipeline extends DocumentAnnotator

A sequence of DocumentAnnotators packaged as a single DocumentAnnotator.
trait DocumentAnnotator extends AnyRef
type DocumentAnnotatorMap = Map[Class[_], () ⇒ DocumentAnnotator]

Mapping from annotation class (usually stored in an attr) to the DocumentAnnotator from which it can be obtained.
class DocumentCubbie[TC <: TokenCubbie, SC <: SentenceCubbie, TSC <: TokenSpanCubbie] extends util.Cubbie with AttrCubbieSlots

A Cubbie for serializing a Document, with separate slots for the Tokens, Sentences, and TokenSpans.
case class DocumentName(string: String) extends Product with Serializable

Used as an attribute on Document to hold the document's name.
trait DocumentSubstring extends AnyRef

A portion of the string contents of a Document.
class MutableDocumentAnnotatorMap extends LinkedHashMap[Class[_], () ⇒ DocumentAnnotator]

A Map from annotation class to DocumentAnnotator that provides that annotation.
trait Section extends Chain[Section, Token] with DocumentSubstring with Attr

A part of a Document, delineated by character offsets into the Document's string, and which can hold a sequence of Tokens and a sequence of Sentences.
class Sentence extends TokenSpan

A span of Tokens making up a sentence within a Section of a Document.
class SentenceCubbie extends TokenSpanCubbie
trait SentenceParseCubbie extends SentenceCubbie
trait SharedNLPCmdOptions extends CmdOptions

Command-line options available on all NLP model trainers.
class Token extends Observation[Token] with ChainLink[Token, Section] with DocumentSubstring with Attr

A word in a document, covering a substring of the Document.
class TokenCubbie extends util.Cubbie
trait TokenIobConllNerTagCubbie extends TokenCubbie
trait TokenPennPosTagCubbie extends TokenCubbie
class TokenSpan extends SpanVariable[Section, Token] with Attr

A sub-sequence of Tokens within a Section (which is in turn part of a Document).
class TokenSpanBuffer[S <: TokenSpan] extends SpanVarBuffer[S, Section, Token] with TokenSpanCollection[S]

A mutable collection of TokenSpans, with various methods to return filtered subsets of spans based on position and class.
trait TokenSpanCollection[S <: TokenSpan] extends SpanVarCollection[S, Section, Token]
class TokenSpanCubbie extends util.Cubbie
class TokenSpanList[S <: TokenSpan] extends SpanVarList[S, Section, Token] with TokenSpanCollection[S]

An immutable collection of TokenSpans, with various methods to return filtered subsets of spans based on position and class.
trait TokenSpanNerLabelCubbieSlot extends TokenSpanCubbie
trait TokenSpanWithDocRefCubbie[DC <: DocumentCubbie[_, _, _]] extends TokenSpanCubbie
trait TokenSpanWithPhraseCubbie extends TokenSpanCubbie
class TokenString extends StringVariable

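Used as an attribute of Token when the token.string should be different from the document.string substring at the Token's start and end positions.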
trait TokenStringCubbieSlot extends TokenCubbie

Value Members

object DocumentAnnotatorPipeline extends FastLogging

A factory for creating DocumentAnnotatorPipelines given requirements about which annotations or which DocumentAnnotators are desired.
object NLP

A command-line driver for DocumentAnnotators.
object NoopDocumentAnnotator extends DocumentAnnotator
object TokenSpan
object UnknownDocumentAnnotator extends DocumentAnnotator

Used as a stand-in dummy DocumentAnnotator in the DocumentAnnotatorMap when an annotation was added but not by a real DocumentAnnotator.
def bilouBoundaries(labels: Seq[String]): Seq[(Int, Int, String)]
def bioBoundaries(labels: Seq[String]): Seq[(Int, Int)]
package coref
package embeddings
package hcoref
def iobBoundaries(labels: Seq[String]): Seq[(Int, Int, String)]

Given a sequence of strings describing labels in IOB format, such as O I-PER I-LOC B-LOC I-LOC O I-ORG (where the I and B prefixes are separated by a dash from the type suffix), return a sequence of tuples indicating span start, length, and label suffix, such as (3, 2, "LOC").
package lemma
package lexicon
package load
package morph
package ner
package parse
package phrase
package pos
package relation
package segment
package wordnet

package nlp

Type Members

trait AttrCubbieSlots extends util.Cubbie

class BasicSection extends Section

trait DateAttrCubbieSlot extends util.Cubbie with AttrCubbieSlots

class Document extends DocumentSubstring with Attr

class DocumentAnnotationPipeline extends DocumentAnnotator

trait DocumentAnnotator extends AnyRef

type DocumentAnnotatorMap = Map[Class[_], () ⇒ DocumentAnnotator]

class DocumentCubbie[TC <: TokenCubbie, SC <: SentenceCubbie, TSC <: TokenSpanCubbie] extends util.Cubbie with AttrCubbieSlots

case class DocumentName(string: String) extends Product with Serializable

trait DocumentSubstring extends AnyRef

class MutableDocumentAnnotatorMap extends LinkedHashMap[Class[_], () ⇒ DocumentAnnotator]

trait Section extends Chain[Section, Token] with DocumentSubstring with Attr

class Sentence extends TokenSpan

class SentenceCubbie extends TokenSpanCubbie

trait SentenceParseCubbie extends SentenceCubbie

trait SharedNLPCmdOptions extends CmdOptions

class Token extends Observation[Token] with ChainLink[Token, Section] with DocumentSubstring with Attr

class TokenCubbie extends util.Cubbie

trait TokenIobConllNerTagCubbie extends TokenCubbie

trait TokenPennPosTagCubbie extends TokenCubbie

class TokenSpan extends SpanVariable[Section, Token] with Attr

class TokenSpanBuffer[S <: TokenSpan] extends SpanVarBuffer[S, Section, Token] with TokenSpanCollection[S]

trait TokenSpanCollection[S <: TokenSpan] extends SpanVarCollection[S, Section, Token]

class TokenSpanCubbie extends util.Cubbie

class TokenSpanList[S <: TokenSpan] extends SpanVarList[S, Section, Token] with TokenSpanCollection[S]

trait TokenSpanNerLabelCubbieSlot extends TokenSpanCubbie

trait TokenSpanWithDocRefCubbie[DC <: DocumentCubbie[_, _, _]] extends TokenSpanCubbie

trait TokenSpanWithPhraseCubbie extends TokenSpanCubbie

class TokenString extends StringVariable

trait TokenStringCubbieSlot extends TokenCubbie

Value Members

object DocumentAnnotatorPipeline extends FastLogging

object NLP

object NoopDocumentAnnotator extends DocumentAnnotator

object TokenSpan

object UnknownDocumentAnnotator extends DocumentAnnotator

def bilouBoundaries(labels: Seq[String]): Seq[(Int, Int, String)]

def bioBoundaries(labels: Seq[String]): Seq[(Int, Int)]

package coref

package embeddings

package hcoref

def iobBoundaries(labels: Seq[String]): Seq[(Int, Int, String)]

package lemma

package lexicon

package load

package morph

package ner

package parse

package phrase

package pos

package relation

package segment

package wordnet

Inherited from AnyRef

Inherited from Any

Ungrouped