Go to the documentation of this file.
37 #include "ticcutils/LogStream.h"
38 #include "ticcutils/Configuration.h"
39 #include "ticcutils/Unicode.h"
40 #include "libfolia/folia.h"
46 mwuAna(
const std::string&,
bool,
size_t );
/// Shorthand for a std::multimap keyed by std::string whose mapped values are std::vector<std::string>.
66 #define mymap2 std::multimap<std::string, std::vector<std::string> >
71 explicit Mwu( TiCC::LogStream*, TiCC::LogStream* );
74 bool init(
const TiCC::Configuration& );
79 const std::vector<folia::Word*>& )
const;
/// Return the value of the mwu_tagset member, by value.
/// The object itself is not modified (const member function).
81 std::string
getTagset()
const {
return mwu_tagset; };
/// Return the value of the _version member, by value.
/// The object itself is not modified (const member function).
82 std::string
version()
const {
return _version; };
84 bool readsettings(
const std::string&,
const std::string&);
85 bool read_mwus(
const std::string& );
88 std::string mwuFileName;
89 std::vector<mwuAna*> mWords;
91 TiCC::LogStream *errLog;
92 TiCC::LogStream *dbgLog;
94 std::string textclass;
95 std::string mwu_tagset;
97 TiCC::UniFilter *filter;
friend std::ostream & operator<<(std::ostream &, const Mwu &)
Definition: mwu_chunker_mod.cxx:217
bool spec
Definition: mwu_chunker_mod.h:63
void Classify(frog_data &)
Definition: mwu_chunker_mod.cxx:249
virtual ~mwuAna()
Definition: mwu_chunker_mod.h:47
A data structure that holds all frogged information for one sentence.
Definition: FrogData.h:76
size_t mwu_end
Definition: mwu_chunker_mod.h:58
std::string word
Definition: mwu_chunker_mod.h:61
bool isSpec()
Definition: mwu_chunker_mod.h:55
bool init(const TiCC::Configuration &)
Definition: mwu_chunker_mod.cxx:149
std::string getWord() const
Definition: mwu_chunker_mod.h:51
#define mymap2
Definition: mwu_chunker_mod.h:66
A simple data structure that holds all frogged information for one word.
Definition: FrogData.h:47
std::string getTagset() const
Return the value of mwu_tagset (set via Configuration).
Definition: mwu_chunker_mod.h:81
void add_result(const frog_data &, const std::vector< folia::Word * > &) const
Definition: mwu_chunker_mod.cxx:385
Definition: mwu_chunker_mod.h:68
Definition: mwu_chunker_mod.h:43
void add_provenance(folia::Document &, folia::processor *) const
Definition: mwu_chunker_mod.cxx:227
void add(frog_record &)
Definition: mwu_chunker_mod.cxx:107
mwuAna()
Definition: mwu_chunker_mod.h:61
~Mwu()
Definition: mwu_chunker_mod.cxx:91
std::string version() const
Definition: mwu_chunker_mod.h:82
friend std::ostream & operator<<(std::ostream &, const mwuAna &)
void reset()
Definition: mwu_chunker_mod.cxx:99
size_t mwu_start
Definition: mwu_chunker_mod.h:55
void merge(const mwuAna *)
Definition: mwu_chunker_mod.cxx:66
Mwu(TiCC::LogStream *, TiCC::LogStream *)
Definition: mwu_chunker_mod.cxx:78