conllu

Types

pub type Feature {
  PronType(String)
  Gender(String)
  VerbForm(String)
  NumType(String)
  Animacy(String)
  Mood(String)
  Poss(String)
  NounClass(String)
  Tense(String)
  Reflex(String)
  Number(String)
  Aspect(String)
  Foreign(String)
  Case(String)
  Voice(String)
  Abbr(String)
  Definite(String)
  Evident(String)
  Typo(String)
  Deixis(String)
  Polarity(String)
  DeixisRef(String)
  Person(String)
  Degree(String)
  Polite(String)
  Clusivity(String)
  Custom(String, String)
}

Constructors

  • PronType(String)
  • Gender(String)
  • VerbForm(String)
  • NumType(String)
  • Animacy(String)
  • Mood(String)
  • Poss(String)
  • NounClass(String)
  • Tense(String)
  • Reflex(String)
  • Number(String)
  • Aspect(String)
  • Foreign(String)
  • Case(String)
  • Voice(String)
  • Abbr(String)
  • Definite(String)
  • Evident(String)
  • Typo(String)
  • Deixis(String)
  • Polarity(String)
  • DeixisRef(String)
  • Person(String)
  • Degree(String)
  • Polite(String)
  • Clusivity(String)
  • Custom(String, String)
pub type ParseError {
  InvalidData(WordParts)
  MissingWordInformation(WordParts)
}

Constructors

  • InvalidData(WordParts)
  • MissingWordInformation(WordParts)
pub type Sentence {
  Sentence(
    sent_id: Option(String),
    text: Option(String),
    text_lang: Option(#(String, String)),
    translit: Option(String),
    comments: List(String),
    words: List(Word),
  )
}

Constructors

  • Sentence(
      sent_id: Option(String),
      text: Option(String),
      text_lang: Option(#(String, String)),
      translit: Option(String),
      comments: List(String),
      words: List(Word),
    )

    Arguments

    • text_lang

      Example: a `text_en = “…”` comment, where `en` is the language code.

Universal part-of-speech (UPOS) tag, as defined at https://universaldependencies.org/u/pos/index.html

pub type UPOS {
  ADJ
  ADP
  ADV
  AUX
  CCONJ
  DET
  INTJ
  NOUN
  NUM
  PART
  PRON
  PROPN
  PUNCT
  SCONJ
  SYM
  VERB
  X
}

Constructors

  • ADJ

    adjective

  • ADP

    adposition

  • ADV

    adverb

  • AUX

    auxiliary

  • CCONJ

    coordinating conjunction

  • DET

    determiner

  • INTJ

    interjection

  • NOUN

    noun

  • NUM

    numeral

  • PART

    particle

  • PRON

    pronoun

  • PROPN

    proper noun

  • PUNCT

    punctuation

  • SCONJ

    subordinating conjunction

  • SYM

    symbol

  • VERB

    verb

  • X

    other

A single word with grammatical information

pub type Word {
  Word(
    index: Int,
    form: String,
    lemma: String,
    upos: UPOS,
    xpos: Option(String),
    feats: Option(List(Feature)),
    head: Option(Int),
    deprel: Option(String),
    deps: Option(String),
    misc: Option(String),
  )
}

Constructors

  • Word(
      index: Int,
      form: String,
      lemma: String,
      upos: UPOS,
      xpos: Option(String),
      feats: Option(List(Feature)),
      head: Option(Int),
      deprel: Option(String),
      deps: Option(String),
      misc: Option(String),
    )
pub type WordParts {
  Index
  Form
  Lemma
  UPOS
  XPOS
  Feats
  Head
  Deprel
  Deps
  Misc
}

Constructors

  • Index
  • Form
  • Lemma
  • UPOS
  • XPOS
  • Feats
  • Head
  • Deprel
  • Deps
  • Misc

Functions

pub fn parse(input: String) -> Result(List(Sentence), ParseError)
Search Document