Skip to content
Snippets Groups Projects
Commit 304d2f43 authored by Bartosz Broda
Browse files

add stub for parsing

parent 7fd62f3c
Branches
No related merge requests found
#include "mwereader.h" #include "mwereader.h"
#include "mweparser.h"
#include <boost/algorithm/string.hpp> #include <boost/algorithm/string.hpp>
namespace Corpus2{ namespace Corpus2{
bool MWEReader::registered = TokenReader::register_path_reader<MWEReader>( bool MWEReader::registered = TokenReader::register_path_reader<MWEReader>(
"mwereader","inner,mwepath"); // TODO more help? "mwereader","inner,mwefile"); // TODO more help?
MWEReader::MWEReader(const Tagset &tagset, const std::string &filename) MWEReader::MWEReader(const Tagset &tagset, const std::string &filename)
: TokenReader(tagset), inner_filename_(filename) : TokenReader(tagset), inner_filename_(filename)
...@@ -43,11 +44,15 @@ bool MWEReader::registered = TokenReader::register_path_reader<MWEReader>( ...@@ -43,11 +44,15 @@ bool MWEReader::registered = TokenReader::register_path_reader<MWEReader>(
if(boost::algorithm::starts_with(option, "inner:")) { if(boost::algorithm::starts_with(option, "inner:")) {
std::string inner = option.substr(6); std::string inner = option.substr(6);
inner_reader_ = create_path_reader(inner, this->tagset(), inner_reader_ = create_path_reader(inner, this->tagset(),
inner_filename_); inner_filename_);
}
if(boost::algorithm::starts_with(option, "mwefile:")) {
std::string mwefile = option.substr(8);
load_mwes(mwefile);
} }
// TODO MWE stuff // TODO more MWE stuff
} }
void MWEReader::validate() void MWEReader::validate()
...@@ -66,5 +71,11 @@ bool MWEReader::registered = TokenReader::register_path_reader<MWEReader>( ...@@ -66,5 +71,11 @@ bool MWEReader::registered = TokenReader::register_path_reader<MWEReader>(
return inner_reader_->get_option(option); return inner_reader_->get_option(option);
} }
void MWEReader::load_mwes(const std::string &filename)
{
MWEParser parser;
parser.parse_file(filename);
}
}// ns Corpus2 }// ns Corpus2
...@@ -3,6 +3,8 @@ ...@@ -3,6 +3,8 @@
#include <libcorpus2/io/reader.h> #include <libcorpus2/io/reader.h>
#include "mwe.h"
namespace Corpus2 { namespace Corpus2 {
...@@ -43,7 +45,11 @@ public: ...@@ -43,7 +45,11 @@ public:
virtual void validate(); virtual void validate();
static bool registered; static bool registered;
private: private:
void load_mwes(const std::string& filename);
//MWEIndex mwe_index_;
/// ptr to inner reader doing the real work of reading a corpus /// ptr to inner reader doing the real work of reading a corpus
TokenReaderPtr inner_reader_; TokenReaderPtr inner_reader_;
/// path for inner reader /// path for inner reader
......
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment