Go to the documentation of this file.
39 #include "ticcutils/json.hpp"
65 std::vector<std::vector<std::string>>
morphs;
84 std::string
sentence(
bool =
false )
const;
87 std::map<size_t,size_t>
mwus;
friend frog_data extract_fd(std::vector< Tokenizer::Token > &)
a data structure to hold all frogged information of one sentence
Definition: FrogData.h:76
std::vector< std::string > lemmas
a list of possible lemmas
Definition: FrogData.h:64
std::string compound_string
string representation of first compound
Definition: FrogData.h:67
double iob_confidence
the confidence of the IOB tag
Definition: FrogData.h:61
std::string sentence(bool=false) const
Definition: FrogData.cxx:232
std::string tag
the assigned POS tag
Definition: FrogData.h:58
std::string word
the word in UTF8
Definition: FrogData.h:52
bool no_space
was there a space after the word?
Definition: FrogData.h:56
std::string language
the detected language of the word
Definition: FrogData.h:55
frog_record()
default constructor
Definition: FrogData.cxx:44
double tag_confidence
the confidence of the POS tag
Definition: FrogData.h:59
Definition: mbma_brackets.h:74
std::string parse_role
role of the dependency
Definition: FrogData.h:71
std::string clean_word
lowercased word (MBMA only)
Definition: FrogData.h:53
void append(const frog_record &)
Definition: FrogData.cxx:292
a simple data structure to hold all frogged information of one word
Definition: FrogData.h:47
std::string morph_string
string representation of first morph
Definition: FrogData.h:68
nlohmann::json to_json() const
Definition: FrogData.cxx:63
bool empty() const
Definition: FrogData.h:80
std::string ner_tag
the assigned NER tag
Definition: FrogData.h:62
int parse_index
label of the dependency
Definition: FrogData.h:70
Definition: FrogData.h:42
std::set< size_t > parts
set of indices an MWU is made of (MWU only)
Definition: FrogData.h:72
std::string token_class
the assigned token class of the word
Definition: FrogData.h:54
std::vector< frog_record > units
the records that make up the sentence
Definition: FrogData.h:85
~frog_record()
default destructor
Definition: FrogData.cxx:57
std::map< size_t, size_t > mwus
Definition: FrogData.h:87
void resolve_mwus()
Definition: FrogData.cxx:250
std::string get_language() const
Definition: FrogData.cxx:300
bool new_paragraph
did the tokenizer detect a paragraph here?
Definition: FrogData.h:57
std::ostream & operator<<(std::ostream &os, const frog_record &fr)
Definition: FrogData.cxx:123
std::string iob_tag
the assigned IOB tag
Definition: FrogData.h:60
size_t size() const
Definition: FrogData.h:79
std::vector< frog_record > mw_units
the MWU records that make up the sentence
Definition: FrogData.h:86
double ner_confidence
the confidence of the NER tag
Definition: FrogData.h:63
std::vector< std::vector< std::string > > morphs
the morph analysis
Definition: FrogData.h:65
std::vector< const BaseBracket * > deep_morphs
pointers to the deep morphemes
Definition: FrogData.h:66
std::string deep_morph_string
string representation of first deep_morph
Definition: FrogData.h:69