WsParser_VS/libSyntax/libsyntax.cpp

442 lines
13 KiB
C++

#include "libsyntax.h"
#include "ast_basic.h"
#include <tuple>
#include <QDebug>
using namespace lib_syntax;
using namespace std;
using namespace lib_token;
using namespace lib_words;
using namespace ast_basic;
auto content_extractm = [](std::shared_ptr<const lib_token::IActionToken> token) {
QString content;
while (token) {
if (token->defines())
content.prepend(token->content() + " ");
token = token->prevToken();
}
return content;
};
__anyone_impl::__anyone_impl(const QList<std::shared_ptr<const IBasicRule>> mbrs) : mbrs_store(mbrs) {
}
QList<std::shared_ptr<const IBasicRule>> __anyone_impl::children() const {
return mbrs_store;
}
QList<std::shared_ptr<const MatchCursor>> __anyone_impl::parse(std::shared_ptr<const MatchCursor> cursor) const {
if (cursor->parseFailure() || cursor->parseComplete())
return QList<std::shared_ptr<const MatchCursor>>() << cursor;
auto syntax = present();
QList<std::shared_ptr<const MatchCursor>> result_list;
for (auto rx : this->children())
result_list.append(rx->parse(cursor));
// 完全匹配分支,必须有匹配进展
decltype(result_list) completely_list;
std::copy_if(result_list.begin(), result_list.end(), std::back_inserter(completely_list),
[&](std::shared_ptr<const MatchCursor> ins) {
return (cursor->totalErrorCount() == ins->totalErrorCount() && ins->operator>(*cursor))
|| ins->parseComplete();
});
if (completely_list.size())
return completely_list.mid(0,1);
// 经过修正的分支,必须有变化
decltype(result_list) modify_list;
std::copy_if(result_list.begin(), result_list.end(),
std::back_inserter(modify_list),
[&](std::shared_ptr<const MatchCursor> ins) {
return !ins->parseFailure() && ins->totalErrorCount() > cursor->totalErrorCount();
});
if (modify_list.size())
return modify_list;
// 匹配失败的分支
decltype(result_list) errors_list;
std::copy_if(result_list.begin(), result_list.end(),
std::back_inserter(errors_list), [](std::shared_ptr<const MatchCursor> it) { return it->parseFailure(); });
return errors_list;
}
QString __anyone_impl::present() const {
QString members_content;
for (auto& it : children()) {
members_content += it->present() + "|";
}
return members_content.mid(0, members_content.size() - 1);
}
__sequence_impl::__sequence_impl(const QList<std::shared_ptr<const IBasicRule>> mbrs)
: mbrs_store(mbrs) {
}
QList<std::shared_ptr<const IBasicRule>> __sequence_impl::children() const {
return mbrs_store;
}
QList<std::shared_ptr<const MatchCursor>> __sequence_impl::parse(std::shared_ptr<const MatchCursor> cursor) const {
if (cursor->parseFailure() || cursor->parseComplete())
return QList<std::shared_ptr<const MatchCursor>>() << cursor;
QList<std::shared_ptr<const MatchCursor>> bridge_list{ cursor };
for (auto rule : this->children()) {
QList<std::shared_ptr<const MatchCursor>> current_result;
for (auto vcurs : bridge_list) {
if (!vcurs->parseFailure()) {
current_result.append(rule->parse(vcurs));
}
}
// 完全匹配的分支
decltype(current_result) temprary_list;
std::copy_if(current_result.begin(), current_result.end(),
std::back_inserter(temprary_list), [&](std::shared_ptr<const MatchCursor> ins) {
return cursor->totalErrorCount() == ins->totalErrorCount() || ins->parseComplete();
});
if (temprary_list.size()) {
bridge_list = temprary_list.mid(0,1);
continue;
}
// 经过修复的分支
std::copy_if(current_result.begin(), current_result.end(), std::back_inserter(temprary_list),
[&](std::shared_ptr<const MatchCursor> ins) { return !ins->parseFailure(); });
if (temprary_list.size()) {
bridge_list = temprary_list;
continue;
}
bridge_list = current_result;
break;
}
decltype(bridge_list) temprary_list;
// 匹配代码有进展或者匹配成功
std::copy_if(bridge_list.begin(), bridge_list.end(),
std::back_inserter(temprary_list), [&](std::shared_ptr<const MatchCursor> ins) {
return ins->operator>(*cursor) || ins->parseComplete();
});
if (temprary_list.size())
return temprary_list;
std::copy_if(bridge_list.begin(), bridge_list.end(),
std::back_inserter(temprary_list), [](std::shared_ptr<const MatchCursor> ins) { return ins->parseFailure(); });
return temprary_list;
}
QString __sequence_impl::present() const {
QString content;
for (auto& it : children())
content += it->present() + " ";
return content.mid(0, content.size() - 1);
}
__repeat_impl::__repeat_impl(std::shared_ptr<const IBasicRule> rule, int min, int max)
: rule_peer(rule), min_match(min), max_match(max) {
}
QList<std::shared_ptr<const IBasicRule>> __repeat_impl::children() const {
return QList<std::shared_ptr<const IBasicRule>>() << rule_peer;
}
#include <algorithm>
QList<std::shared_ptr<const MatchCursor>> __repeat_impl::parse(std::shared_ptr<const MatchCursor> cursor) const {
if (cursor->parseFailure() || cursor->parseComplete())
return QList<std::shared_ptr<const MatchCursor>>() << cursor;
auto syntax = present();
QList<std::shared_ptr<const MatchCursor>> max_match_begin = { cursor };
if (min_match) {
QList<std::shared_ptr<const IBasicRule>> temp_rules;
for (auto idx = 0; idx < min_match; ++idx)
temp_rules << this->rule_peer;
auto seqs_rule = std::make_shared<__sequence_impl>(temp_rules);
max_match_begin = seqs_rule->parse(cursor);
}
// 如果不满足最小重复匹配次数要求,则返回
int continue_count = std::count_if(max_match_begin.begin(), max_match_begin.end(),
[](std::shared_ptr<const MatchCursor > ins) { return !ins->parseFailure(); });
if (!continue_count)
return max_match_begin;
// 最小匹配次数中所有错误分支都是无用的、需要舍弃
for (auto idx = 0; idx < max_match_begin.size(); ++idx) {
auto current_cursor = max_match_begin.at(idx);
if (current_cursor->parseFailure())
max_match_begin.removeAt(idx--);
}
QList<std::shared_ptr<const MatchCursor>> results;
decltype(results) bridge_list = max_match_begin;
// 尝试重复匹配最大次数
for (auto idx = min_match; idx < max_match; ++idx) {
QList<std::shared_ptr<const MatchCursor>> current_list;
// 匹配迭代一次
for (auto ins : bridge_list)
current_list.append(this->rule_peer->parse(ins));
QList<QString> contents;
for (auto bx : current_list)
contents << content_extractm(bx->token()) + QStringList(bx->totalErrors()).join(',');
// 提取完全匹配的分支
QList<std::shared_ptr<const MatchCursor>> temprary_branchs;
std::copy_if(current_list.begin(), current_list.end(),
std::back_inserter(temprary_branchs), [&](std::shared_ptr<const MatchCursor> ins) {
return (cursor->totalErrorCount() == ins->totalErrorCount() && (*ins) > (*cursor)) || ins->parseComplete();
});
if (temprary_branchs.size()) {
bridge_list = temprary_branchs.mid(0, 1);
continue;
}
// 提取语法修正分支
std::copy_if(current_list.begin(), current_list.end(),
std::back_inserter(temprary_branchs), [&](std::shared_ptr<const MatchCursor> ins) {
return !ins->parseFailure() && (*ins) > (*cursor);
});
if (temprary_branchs.size()) {
bridge_list = temprary_branchs;
continue;
}
break;
}
results.append(bridge_list);
std::sort(results.begin(), results.end(),
[](std::shared_ptr<const MatchCursor> a, std::shared_ptr<const MatchCursor> b) {
return a->operator>(*b);
});
// 提取完全匹配的分支
decltype(results) rets_completely;
for (auto ins : results) {
if (ins->totalErrorCount() == cursor->totalErrorCount() && !rets_completely.size()) {
rets_completely.append(ins);
break;
}
else if (ins->parseComplete())
rets_completely.append(ins);
}
// 提取经过修正的分支
decltype(results) rets_modified;
for (auto ins : results) {
if (!ins->parseFailure()) {
if (!rets_modified.size()) {
rets_modified.append(ins);
}
else if (rets_modified.last()->token()->position() == ins->token()->position()) {
rets_modified.append(ins);
}
}
}
// 允许持续的集合
for (auto rst : rets_modified)
if (!rets_completely.contains(rst))
rets_completely.append(rst);
if (rets_completely.size())
return rets_completely;
return results;
}
QString __repeat_impl::present() const {
if (min_match == 0 && max_match == INT_MAX)
return "(" + this->rule_peer->present() + QString(")*");
else if (min_match == 1 && max_match == INT_MAX)
return "(" + this->rule_peer->present() + QString(")+");
else if (min_match == 0 && max_match == 1)
return "(" + this->rule_peer->present() + QString(")?");
return "(" + this->rule_peer->present() + QString("){%1, %2}").arg(min_match).arg(max_match);
}
SyntaxException::SyntaxException(const QString& message) {
this->msg_store = message;
}
QString SyntaxException::message() const {
return msg_store;
}
ExprRule::ExprRule(const QString& rule_name, int expr_mark)
: name_store(rule_name), mark_store(expr_mark) {
}
QString ExprRule::name() const {
return name_store;
}
int ExprRule::typeMark() const {
return this->mark_store;
}
#include <ast_novel.h>
MatchCursor::MatchCursor(const QString& path) :_file_path(path) {
}
MatchCursor::MatchCursor(std::shared_ptr<const MatchCursor> other_ptr)
: _prev_cursor(other_ptr),
_file_path(other_ptr->_file_path),
_total_errors(other_ptr->_total_errors),
_current_token(other_ptr->_current_token),
_remains_word(other_ptr->_remains_word) {
for (auto err_pack : other_ptr->_exprs_errors) {
_exprs_errors << std::make_shared<ErrsPack>(*err_pack);
}
}
bool lib_syntax::MatchCursor::operator>(const MatchCursor& other) const {
return _current_token->position() > other._current_token->position() ||
(_current_token->position() == other._current_token->position() && _total_errors.size() > other._total_errors.size());
}
std::shared_ptr<const MatchCursor> MatchCursor::previous() const {
return _prev_cursor;
}
QString MatchCursor::filePath() const {
return _file_path;
}
QString lib_syntax::MatchCursor::parseSyntax() const {
if (!this->previous())
return QString();
QString token_splitx;
switch (this->token()->tokenType()) {
case lib_token::IActionToken::Type::ElementBegin:
token_splitx = "<B>";
break;
case lib_token::IActionToken::Type::TokenBind:
token_splitx = this->token()->defines()->regex();
break;
case lib_token::IActionToken::Type::ElementEnd:
token_splitx = "<E>";
break;
}
return this->previous()->parseSyntax() + " " + token_splitx;
}
void MatchCursor::enterExprs() {
auto new_expr = std::make_shared<ErrsPack>();
this->_exprs_errors.push_back(new_expr);
}
void lib_syntax::MatchCursor::logExprsError(std::shared_ptr<const lib_words::IPrimitiveWord> t, const QString& msg) {
auto pos_key = t?t->position():0;
if(!this->_total_errors.contains(pos_key))
this->_total_errors[pos_key] = QStringList();
auto exists = this->_total_errors[pos_key];
exists.append(msg);
this->_total_errors[pos_key] = exists;
this->_exprs_errors.last()->addError(t, msg);
// 普适性质的判定标准
this->setFailure(this->exprsErrorCount() > 1 || this->_total_errors.size() > 300);
}
void MatchCursor::quitExprs() {
this->_exprs_errors.pop_back();
}
bool lib_syntax::MatchCursor::parseFailure() const {
return this->_parse_stop_with_errors;
}
void lib_syntax::MatchCursor::setFailure(bool mark) {
this->_parse_stop_with_errors = mark;
}
bool lib_syntax::MatchCursor::parseComplete() const {
return this->_parse_complete;
}
void lib_syntax::MatchCursor::setComplete(bool mark) {
this->_parse_complete = mark;
}
int MatchCursor::exprsErrorCount() const {
if (this->_exprs_errors.size())
return this->_exprs_errors.last()->errorCount();
return 0;
}
int MatchCursor::totalErrorCount() const {
return this->_total_errors.size();
}
QList<QString> MatchCursor::totalErrors() const {
QStringList flist;
for(auto set : this->_total_errors)
flist.append(set);
return flist;
}
void lib_syntax::MatchCursor::mergeWith(const MatchCursor& other) {
for(auto key : other._total_errors.keys()){
if (!this->_total_errors.contains(key))
this->_total_errors[key] = QStringList();
auto values = other._total_errors[key];
auto this_values = this->_total_errors[key];
this_values.append(values);
this->_total_errors[key] = this_values;
}
for (auto key : this->_total_errors.keys()) {
auto values = this->_total_errors[key];
values = values.toSet().toList();
this->_total_errors[key] = values;
}
}
void MatchCursor::setCurrent(std::shared_ptr<const IActionToken> t, std::shared_ptr<const IPrimitiveWord> remains) {
this->_current_token = t;
this->_remains_word = remains;
}
std::shared_ptr<const IActionToken> MatchCursor::token() const {
return this->_current_token;
}
std::shared_ptr<const IPrimitiveWord> MatchCursor::words() const {
return this->_remains_word;
}
lib_syntax::MatchCursor::ErrsPack::ErrsPack() {
}
lib_syntax::MatchCursor::ErrsPack::ErrsPack(const ErrsPack& other)
: _error_collection(other._error_collection) {
}
void lib_syntax::MatchCursor::ErrsPack::addError(std::shared_ptr<const lib_words::IPrimitiveWord> t, const QString& msg) {
this->_error_collection << std::make_pair(t, msg);
}
QList<std::pair<std::shared_ptr<const lib_words::IPrimitiveWord>, QString>> MatchCursor::ErrsPack::errors() const {
return _error_collection;
}
uint64_t MatchCursor::ErrsPack::errorCount() const {
return _error_collection.size();
}