#include "libwords.h" #include #include using namespace lib_words; std::shared_ptr WordReader::wordsFrom(QTextStream &tin, const QString& path) const { auto primary_words = extract_primary(tin, path); if (!primary_words.size()) return nullptr; std::shared_ptr prev_ptr = std::make_shared(primary_words.last(), nullptr); for (auto idx = primary_words.size() - 2; idx >= 0; --idx) { auto content_ptr = primary_words[idx]; prev_ptr = std::make_shared(content_ptr, prev_ptr); } return prev_ptr; } QList> lib_words::WordReader::extract_primary(QTextStream& tin, const QString& f) const{ QList> ret_list; int line_number = 1; while (!tin.atEnd()) { uint64_t relative_offset = line_number; relative_offset = relative_offset << 32; auto line = tin.readLine(); ret_list.append(this->parse_line(relative_offset, line_number++, line, f)); } return ret_list; } #include QList> WordReader::parse_line(uint64_t start_pos, int row, const QString& line_text, const QString& path) const { QRegExp split_char(u8"\\s"); auto words = line_text.split(split_char, QString::SplitBehavior::SkipEmptyParts); QList> primary_words; int columns_offset = 0; for (auto& w : words) { auto column_start = line_text.indexOf(w, columns_offset); auto token = std::make_shared(row, column_start + 1, start_pos + column_start, w, path); primary_words << token; columns_offset = column_start + w.length(); } return primary_words; } WordImpl::WordImpl(std::shared_ptr content, std::shared_ptr next) : content_ptr(content), next_ptr(next) { } QString WordImpl::file() const { return content_ptr->file(); } uint64_t WordImpl::position() const { return content_ptr->position(); } QString WordImpl::content() const { return content_ptr->content(); } int WordImpl::row() const { return content_ptr->row(); } int WordImpl::column() const { return content_ptr->column(); } std::shared_ptr WordImpl::nextWord() const { return next_ptr; } WordsException::WordsException(const QString& message) : msg_store(message) { } QString WordsException::message() const { return msg_store; } WordContent::WordContent(int r, int c, uint64_t pos, const QString& t, const QString& p) : row_n(r), col_n(c), doc_offset(pos), text_n(t), path_p(p) { } QString WordContent::file() const { return path_p; } uint64_t WordContent::position() const { return doc_offset; } QString WordContent::content() const { return text_n; } int WordContent::row() const { return row_n; } int WordContent::column() const { return col_n; } std::shared_ptr WordContent::nextWord() const { return nullptr; }