1 #ifndef TOKENIZED_SENTENCE_HDR
2 #define TOKENIZED_SENTENCE_HDR
4 #include "concordia/common/config.hpp"
5 #include "concordia/token_annotation.hpp"
6 #include "concordia/word_map.hpp"
8 #include <boost/shared_ptr.hpp>
13 #include <boost/foreach.hpp>
51 return _originalSentence;
66 return _tokenAnnotations;
73 std::vector<INDEX_CHARACTER_TYPE>
getCodes()
const {
120 friend std::ostream & operator << (std::ostream & o,
136 std::string _sentence;
138 std::string _originalSentence;
140 std::list<TokenAnnotation> _tokenAnnotations;
142 std::vector<INDEX_CHARACTER_TYPE> _codes;
144 std::vector<TokenAnnotation> _tokens;
std::string getSentence() const
Definition: tokenized_sentence.hpp:42
virtual ~TokenizedSentence()
Definition: tokenized_sentence.cpp:14
std::string getOriginalSentence() const
Definition: tokenized_sentence.hpp:50
void generateTokens()
Definition: tokenized_sentence.cpp:70
void toLowerCase()
Definition: tokenized_sentence.cpp:56
int getType() const
Definition: token_annotation.hpp:36
std::list< TokenAnnotation > getAnnotations() const
Definition: tokenized_sentence.hpp:65
SUFFIX_MARKER_TYPE getStart() const
Definition: interval.hpp:49
SUFFIX_MARKER_TYPE getEnd() const
Definition: interval.hpp:56
Definition: tokenized_sentence.hpp:26
std::vector< TokenAnnotation > getTokens() const
Definition: tokenized_sentence.hpp:82
TokenizedSentence(std::string sentence)
Definition: tokenized_sentence.cpp:9
void generateHash(boost::shared_ptr< WordMap > wordMap)
Definition: tokenized_sentence.cpp:60
std::string getTokenizedSentence() const
Definition: tokenized_sentence.cpp:79
std::vector< INDEX_CHARACTER_TYPE > getCodes() const
Definition: tokenized_sentence.hpp:73
Definition: token_annotation.hpp:16
std::string getValue() const
Definition: token_annotation.hpp:43
void addAnnotations(std::vector< TokenAnnotation > annotations)
Definition: tokenized_sentence.cpp:17