Go to the documentation of this file.
36 #include "timbl/TimblAPI.h"
38 #include "ticcutils/Configuration.h"
39 #include "ticcutils/LogStream.h"
40 #include "ticcutils/FdStream.h"
41 #include "ticcutils/ServerBase.h"
43 #include "libfolia/folia.h"
44 #include "ucto/tokenize.h"
170 const TiCC::Configuration&,
176 folia::Document *
FrogFile(
const std::string&, std::ostream& );
177 void FrogServer( Sockets::ClientSocket &conn );
186 folia::Document *run_folia_engine(
const std::string&,
188 folia::Document *run_text_engine(
const std::string&,
190 folia::FoliaElement* start_document(
const std::string&,
191 folia::Document *& )
const;
192 folia::FoliaElement *append_to_folia( folia::FoliaElement *,
194 unsigned int& )
const;
195 void add_ner_result( folia::Sentence *,
197 const std::vector<folia::Word*>& )
const;
198 void add_iob_result( folia::Sentence *,
200 const std::vector<folia::Word*>& )
const;
201 void add_mwu_result( folia::Sentence *,
203 const std::vector<folia::Word*>& )
const;
204 void add_parse_result( folia::Sentence *,
206 const std::vector<folia::Word*>& )
const;
207 folia::processor *add_provenance( folia::Document& )
const;
208 void test_version(
const std::string&,
double );
210 void FrogStdin(
bool prompt );
211 void output_tabbed( std::ostream&,
213 void output_JSON( std::ostream& os,
216 void show_results( std::ostream&,
218 void handle_one_paragraph( std::ostream&,
221 void handle_one_text_parent( std::ostream&,
222 folia::FoliaElement *e,
224 void handle_one_sentence( std::ostream&,
227 void append_to_sentence( folia::Sentence *,
const frog_data& )
const;
228 void append_to_words(
const std::vector<folia::Word*>&,
230 void handle_word_vector( std::ostream&,
231 const std::vector<folia::Word*>&,
234 const TiCC::Configuration& configuration;
236 TiCC::LogStream *theErrLog;
237 TiCC::LogStream *theDbgLog;
250 bool make_flat=
false );
Definition: cgn_tagger_mod.h:38
std::string Frogtostringfromfile(const std::string &)
a datastructure to hold all frogged information of one Sentence
Definition: FrogData.h:76
std::string encoding
which input-encoding do we expect
Definition: FrogAPI.h:124
bool doMwu
should we resolve Multi Word Units?
Definition: FrogAPI.h:65
bool correct_words
should we allow the tokenizer to correct words?
Definition: FrogAPI.h:150
std::vector< std::string > get_full_morph_analysis(folia::Word *word, bool make_flat=false)
Definition: ucto_tokenizer_mod.h:36
std::string textredundancy
determines how much text is added in the FoLiA
Definition: FrogAPI.h:137
bool doQuoteDetection
enable quote detection (NOT USED)
Definition: FrogAPI.h:74
bool test_API
do we want to run some tests?
Definition: FrogAPI.h:97
Definition: mbma_mod.h:53
std::string docid
the FoLiA document ID on output.
Definition: FrogAPI.h:130
bool doAlpino
should we directly run Alpino?
Definition: FrogAPI.h:110
void FrogServer(Sockets::ClientSocket &conn)
bool doSentencePerLine
do we want a sentence per line?
Definition: FrogAPI.h:70
bool doXMLin
do we have FoLiA input?
Definition: FrogAPI.h:83
bool hide_timers
should we hide (suppress) the timing information in the output?
Definition: FrogAPI.h:101
std::set< std::string > languages
all languages to take into account
Definition: FrogAPI.h:134
this class holds the runtime settings for Frog
Definition: FrogAPI.h:59
a simple datastructure to hold all frogged information of one word
Definition: FrogData.h:47
bool doJSONin
do we have JSON input?
Definition: FrogAPI.h:85
bool doLemma
should we run the lemmatizer?
Definition: FrogAPI.h:62
Definition: FrogAPI.h:167
FrogOptions()
Definition: FrogAPI.cxx:128
folia::Document * FrogFile(const std::string &, std::ostream &)
bool doTagger
should we run the tagger?
Definition: FrogAPI.h:69
bool doKanon
do we want FoLiA to be output in a canonical way?
Definition: FrogAPI.h:93
std::vector< std::string > get_compound_analysis(folia::Word *word)
bool interactive
are we running from the command line?
Definition: FrogAPI.h:105
bool doRetry
set retry mode (MISNOMER)
Definition: FrogAPI.h:78
bool doServer
do we want to run as a server?
Definition: FrogAPI.h:90
std::string Frogtostring(const std::string &)
std::string uttmark
the string which separates Utterances
Definition: FrogAPI.h:128
bool doJSONout
do we want JSON output?
Definition: FrogAPI.h:89
Definition: mwu_chunker_mod.h:68
int JSON_pp
for JSON output, use this value to format.
Definition: FrogAPI.h:119
std::string listenport
determines the port to run the Frog Server on
Definition: FrogAPI.h:129
static std::string defaultConfigFile(const std::string &="")
Definition: FrogAPI.cxx:117
bool noStdOut
do we want to suppress output to stdout?
Definition: FrogAPI.h:82
std::string command
stores the original command that invoked Frog
Definition: FrogAPI.h:158
bool doAlpinoServer
should we try to connect to an Alpino server?
Definition: FrogAPI.h:106
Definition: ner_tagger_mod.h:44
bool doTok
should we run the tokenizer?
Definition: FrogAPI.h:61
static std::string defaultConfigDir(const std::string &="")
Definition: FrogAPI.cxx:101
int numThreads
limit for the number of threads
Definition: FrogAPI.h:114
bool doXMLout
do we want FoLiA output?
Definition: FrogAPI.h:84
bool doMorph
should we run the morphological analyzer?
Definition: FrogAPI.h:63
bool doNER
should we run the Named Entity recognizer?
Definition: FrogAPI.h:67
frog_data frog_sentence(std::vector< Tokenizer::Token > &, const size_t)
bool doIOB
should we run the IOB Chunker?
Definition: FrogAPI.h:66
int debugFlag
value for the generic debug level
Definition: FrogAPI.h:115
Definition: mblem_mod.h:54
unsigned int maxParserTokens
limit the number of words to Parse
Definition: FrogAPI.h:154
FrogAPI(FrogOptions &, const TiCC::Configuration &, TiCC::LogStream *, TiCC::LogStream *)
std::string inputclass
the textclass to use on FoLiA input
Definition: FrogAPI.h:131
bool doDeepMorph
do we want a deep morphological analysis?
Definition: FrogAPI.h:64
void run_api_tests(const std::string &, std::ostream &)
bool doParse
should we run the Dependency Parser?
Definition: FrogAPI.h:68
Definition: Frog-util.h:51
Definition: iob_tagger_mod.h:37
std::string outputclass
the textclass to use on FoLiA output
Definition: FrogAPI.h:132
std::string default_language
what is our default language
Definition: FrogAPI.h:133