2013-10-24 17:08:58 +02:00
|
|
|
#include <sstream>
|
2015-04-16 11:39:39 +02:00
|
|
|
#include <stdlib.h>
|
2013-10-24 17:08:58 +02:00
|
|
|
#include "concordia/concordia_config.hpp"
|
|
|
|
#include "concordia/common/logging.hpp"
|
|
|
|
|
|
|
|
// Names of the settings looked up in the configuration file.
// They are typed, file-local constants rather than preprocessor macros so
// that they obey scoping rules and are visible to the debugger.
namespace {

const char * const PUDDLE_TAGSET_PARAM = "puddle_tagset_path";
const char * const WORD_MAP_PARAM = "word_map_path";
const char * const HASHED_INDEX_PARAM = "hashed_index_path";
const char * const MARKERS_PARAM = "markers_path";
const char * const SUFFIX_ARRAY_PARAM = "suffix_array_path";
const char * const HTML_TAGS_PARAM = "html_tags_path";
const char * const SPACE_SYMBOLS_PARAM = "space_symbols_path";
const char * const STOP_WORDS_PARAM = "stop_words_path";
const char * const NAMED_ENTITIES_PARAM = "named_entities_path";
const char * const STOP_SYMBOLS_PARAM = "stop_symbols_path";
const char * const ANUBIS_THRESHOLD_PARAM = "anubis_threshold";

}  // namespace
|
2013-10-24 17:08:58 +02:00
|
|
|
|
2015-04-15 14:14:10 +02:00
|
|
|
/**
 * Loads the configuration from a libconfig file.
 *
 * The file is read and parsed first; afterwards every setting named by the
 * *_PARAM constants is fetched through _readConfigParameterStr() and stored
 * in the matching member. The anubis threshold is stored in the file as
 * text and converted to a floating point number here.
 *
 * \param configFilePath path of the configuration file to read
 * \throws ConcordiaException when the file cannot be read, cannot be
 *         parsed, or when the anubis threshold setting does not begin
 *         with a number; exceptions raised by _readConfigParameterStr()
 *         propagate unchanged
 */
ConcordiaConfig::ConcordiaConfig(const std::string & configFilePath)
                                         throw(ConcordiaException) {
    try {
        _config.readFile(configFilePath.c_str());
    } catch(const libconfig::ParseException &) {
        throw ConcordiaException("Error parsing config file: "+configFilePath);
    } catch(const libconfig::FileIOException &) {
        throw ConcordiaException("I/O error reading config file: "
                                    +configFilePath);
    }

    _puddleTagsetFilePath = _readConfigParameterStr(PUDDLE_TAGSET_PARAM);
    _wordMapFilePath = _readConfigParameterStr(WORD_MAP_PARAM);
    _hashedIndexFilePath = _readConfigParameterStr(HASHED_INDEX_PARAM);
    _markersFilePath = _readConfigParameterStr(MARKERS_PARAM);
    _suffixArrayFilePath = _readConfigParameterStr(SUFFIX_ARRAY_PARAM);
    _htmlTagsFilePath = _readConfigParameterStr(HTML_TAGS_PARAM);
    _spaceSymbolsFilePath = _readConfigParameterStr(SPACE_SYMBOLS_PARAM);
    _stopWordsFilePath = _readConfigParameterStr(STOP_WORDS_PARAM);
    _namedEntitiesFilePath = _readConfigParameterStr(NAMED_ENTITIES_PARAM);
    _stopSymbolsFilePath = _readConfigParameterStr(STOP_SYMBOLS_PARAM);

    // strtod is used instead of atof because it reports whether any
    // characters were converted; atof would silently turn a non-numeric
    // value into a threshold of 0.
    const std::string thresholdText =
        _readConfigParameterStr(ANUBIS_THRESHOLD_PARAM);
    char * parseEnd = NULL;
    const double threshold = strtod(thresholdText.c_str(), &parseEnd);
    if (parseEnd == thresholdText.c_str()) {
        // No conversion was performed: the value is not a number.
        throw ConcordiaException(std::string("Config error: ")
                                    +ANUBIS_THRESHOLD_PARAM
                                    +" setting is not a number");
    }
    _anubisThreshold = threshold;
}
|
|
|
|
|
|
|
|
/**
 * Destructor. The body is intentionally empty: no explicit cleanup is
 * performed here.
 */
ConcordiaConfig::~ConcordiaConfig() {}
|
|
|
|
|
2015-04-15 14:14:10 +02:00
|
|
|
std::string ConcordiaConfig::_readConfigParameterStr(const std::string & name)
|
2013-10-24 17:08:58 +02:00
|
|
|
throw(ConcordiaException) {
|
|
|
|
if (!_config.exists(name)) {
|
|
|
|
throw ConcordiaException("Config error: "+name+" setting not found");
|
|
|
|
} else {
|
|
|
|
return _config.lookup(name);
|
|
|
|
}
|
|
|
|
}
|