concordia-library/concordia/anonymized_sentence.cpp

#include "concordia/anonymized_sentence.hpp"
#include "concordia/common/text_utils.hpp"

#include <iostream>

// Constructs an anonymized sentence from the given text.
// The text is received by value and copied into _sentence; this is the
// only member initialized explicitly here.
AnonymizedSentence::AnonymizedSentence(std::string sentence)
    : _sentence(sentence) {
}

// Destructor. The body is intentionally empty: no explicit cleanup is
// performed here.
AnonymizedSentence::~AnonymizedSentence() {}

void AnonymizedSentence::addAnnotations(std::vector<TokenAnnotation> annotations) {
    std::vector<TokenAnnotation>::iterator newAnnotation = annotations.begin();
    std::list<TokenAnnotation>::iterator existingAnnotation = _tokenAnnotations.begin();
    
    while(newAnnotation != annotations.end()) {
        if (existingAnnotation != _tokenAnnotations.end()) {
            // there are still some existing annotations, so perform checks
            if (newAnnotation->intersects(*existingAnnotation)) {
                // The new annotation intersects with the existing.
                // We can not add it, so let us just move on to the
                // next new annoation.
                newAnnotation++;
            } else {
                // it is now important whether the new interval is before
                // or after existing
                if (newAnnotation->getStart() < existingAnnotation->getStart()) {
                    // New interval does not intersect and is before existing. We add it.
                    _tokenAnnotations.insert(existingAnnotation, *newAnnotation);
                    newAnnotation++;
                } else {
                    // If the new interval is after existing we move to the next existing annoation.
                    existingAnnotation++;
                }
            }
        } else {
            // no more existing annotations, so just add the new annotation
            _tokenAnnotations.push_back(*newAnnotation);
            newAnnotation++;
        }
    }
    
}

void AnonymizedSentence::toLowerCase() {
    _sentence = TextUtils::getInstance().toLowerCase(_sentence);
}
character intervals in progress 2015-06-22 13:52:56 +02:00			`#include "concordia/anonymized_sentence.hpp"`
			`#include "concordia/common/text_utils.hpp"`

			`#include <iostream>`

			`AnonymizedSentence::AnonymizedSentence(std::string sentence):`
			`_sentence(sentence) {`
			`}`

			`AnonymizedSentence::~AnonymizedSentence() {`
			`}`

			`void AnonymizedSentence::addAnnotations(std::vector<TokenAnnotation> annotations) {`
			`std::vector<TokenAnnotation>::iterator newAnnotation = annotations.begin();`
			`std::list<TokenAnnotation>::iterator existingAnnotation = _tokenAnnotations.begin();`

			`while(newAnnotation != annotations.end()) {`
			`if (existingAnnotation != _tokenAnnotations.end()) {`
			`// there are still some existing annotations, so perform checks`
			`if (newAnnotation->intersects(*existingAnnotation)) {`
			`// The new annotation intersects with the existing.`
			`// We can not add it, so let us just move on to the`
			`// next new annoation.`
			`newAnnotation++;`
			`} else {`
			`// it is now important whether the new interval is before`
			`// or after existing`
			`if (newAnnotation->getStart() < existingAnnotation->getStart()) {`
			`// New interval does not intersect and is before existing. We add it.`
			`_tokenAnnotations.insert(existingAnnotation, *newAnnotation);`
			`newAnnotation++;`
			`} else {`
			`// If the new interval is after existing we move to the next existing annoation.`
			`existingAnnotation++;`
			`}`
			`}`
			`} else {`
			`// no more existing annotations, so just add the new annotation`
			`_tokenAnnotations.push_back(*newAnnotation);`
			`newAnnotation++;`
			`}`
			`}`

			`}`

			`void AnonymizedSentence::toLowerCase() {`
			`_sentence = TextUtils::getInstance().toLowerCase(_sentence);`
			`}`