package common
Ordering
- Alphabetic
Visibility
- Public
- All
Type Members
- trait Annotated[TResult] extends AnyRef
- case class ConllSentence(dependency: String, lemma: String, uPos: String, xPos: String, deprel: String, head: Int, sentence: Int, begin: Int, end: Int) extends Product with Serializable
- case class DependencyParsedSentence(tokens: Array[WordWithDependency]) extends Product with Serializable
- case class IndexedTaggedWord(word: String, tag: String, begin: Int = 0, end: Int = 0, confidence: Option[Array[Map[String, String]]] = None, metadata: Map[String, String] = Map()) extends Product with Serializable
- case class IndexedToken(token: String, begin: Int = 0, end: Int = 0) extends Product with Serializable
- class InfixToken extends PreprocessingParser
- class PrefixedToken extends PreprocessingParser
- trait PreprocessingParser extends AnyRef
-
case class
Sentence(content: String, start: Int, end: Int, index: Int, metadata: Option[Map[String, String]] = None) extends Product with Serializable
Structure representing a sentence and its boundaries
- class SuffixedToken extends PreprocessingParser
- case class TableData(header: List[String], rows: List[List[String]]) extends Product with Serializable
- trait Tagged[T >: TaggedSentence <: TaggedSentence] extends Annotated[T]
-
case class
TaggedSentence(taggedWords: Array[TaggedWord], indexedTaggedWords: Array[IndexedTaggedWord] = Array()) extends Product with Serializable
Structure to hold Sentences as list of words and POS-tags
Structure to hold Sentences as list of words and POS-tags
- taggedWords
Word tag pairs
-
case class
TaggedWord(word: String, tag: String) extends Product with Serializable
Word tag pair
- case class TokenPiece(wordpiece: String, token: String, pieceId: Int, isWordStart: Boolean, begin: Int, end: Int) extends Product with Serializable
- case class TokenPieceEmbeddings(wordpiece: String, token: String, pieceId: Int, isWordStart: Boolean, isOOV: Boolean, embeddings: Array[Float], begin: Int, end: Int) extends Product with Serializable
-
case class
TokenizedSentence(indexedTokens: Array[IndexedToken], sentenceIndex: Int) extends Product with Serializable
Internal structure for a sentence that is split into tokens
- case class WordWithDependency(word: String, begin: Int, end: Int, head: Int) extends Product with Serializable
- case class WordpieceEmbeddingsSentence(tokens: Array[TokenPieceEmbeddings], sentenceId: Int) extends Product with Serializable
- case class WordpieceTokenizedSentence(tokens: Array[TokenPiece]) extends Product with Serializable
Value Members
- object Annotated
-
object
ChunkSplit extends Annotated[Sentence]
Helper object to work with Chunks
- object DatasetHelpers
- object DependencyParsed extends Annotated[DependencyParsedSentence]
- object EmbeddingsWithSentence extends Annotated[TokenizedSentence]
- object InfixToken
- object LabeledDependency extends Annotated[ConllSentence]
- object NerTagged extends Tagged[NerTaggedSentence]
- object PosTagged extends Tagged[PosTaggedSentence]
- object PrefixedToken
- object Sentence extends Serializable
-
object
SentenceSplit extends Annotated[Sentence]
Helper object to work with Sentence
- object SuffixedToken
- object TableData extends Serializable
- object TaggedSentence extends Serializable
- object TokenPieceEmbeddings extends Serializable
- object TokenizedWithSentence extends Annotated[TokenizedSentence]
- object WordpieceEmbeddingsSentence extends Annotated[WordpieceEmbeddingsSentence] with Serializable
- object WordpieceTokenized extends Annotated[WordpieceTokenizedSentence]