2021-04-24 11:53:36 +00:00
|
|
|
|
#include <iostream>
|
|
|
|
|
#include <ctime>
|
|
|
|
|
#include <fstream>
|
|
|
|
|
#include <vector>
|
|
|
|
|
#include <string>
|
|
|
|
|
#include <sstream>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
#include <codecvt>
|
2021-04-24 11:53:36 +00:00
|
|
|
|
#include <set>
|
|
|
|
|
#include <map>
|
2021-04-27 04:04:27 +00:00
|
|
|
|
#include <functional>
|
2021-04-29 10:55:04 +00:00
|
|
|
|
#include <iomanip>
|
2021-04-29 12:14:20 +00:00
|
|
|
|
#include <algorithm>
|
2021-04-30 06:07:59 +00:00
|
|
|
|
#include <regex>
|
|
|
|
|
#include <stack>
|
|
|
|
|
#include <queue>
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
|
|
|
|
using namespace std;
|
|
|
|
|
|
|
|
|
|
using std::vector;
|
2021-04-25 18:24:29 +00:00
|
|
|
|
using std::wstring;
|
|
|
|
|
using std::wstringstream;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
using std::pair;
|
2021-04-25 18:24:29 +00:00
|
|
|
|
using std::wcout;
|
|
|
|
|
using std::endl;
|
|
|
|
|
using std::to_string;
|
2021-04-27 04:04:27 +00:00
|
|
|
|
using std::hash;
|
2021-04-29 10:55:04 +00:00
|
|
|
|
using std::setw;
|
2021-04-30 06:07:59 +00:00
|
|
|
|
using std::stack;
|
|
|
|
|
using std::queue;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
|
|
|
|
struct Symbol {
|
|
|
|
|
|
|
|
|
|
const int index;
|
2021-04-29 10:55:04 +00:00
|
|
|
|
wstring name;
|
|
|
|
|
bool terminator;
|
|
|
|
|
bool start;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
Symbol(int index, wstring name, bool terminator, bool start):
|
2021-04-24 11:53:36 +00:00
|
|
|
|
index(index),
|
2021-04-25 04:01:26 +00:00
|
|
|
|
name(std::move(name)),
|
2021-04-25 18:24:29 +00:00
|
|
|
|
terminator(terminator),
|
|
|
|
|
start(start)
|
2021-04-24 11:53:36 +00:00
|
|
|
|
{}
|
|
|
|
|
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
class SymbolTable {
|
2021-04-25 18:24:29 +00:00
|
|
|
|
int index = 1;
|
|
|
|
|
|
|
|
|
|
map<wstring, Symbol *> table;
|
|
|
|
|
|
|
|
|
|
map<int, Symbol *> cache;
|
|
|
|
|
|
|
|
|
|
vector<const Symbol *> line;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
|
|
|
|
public:
|
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
SymbolTable() {
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
auto symbol = new Symbol(0, L"<EFBFBD><EFBFBD>", true, false);
|
|
|
|
|
table.insert(pair<wstring, Symbol *>(L"<EFBFBD><EFBFBD>", symbol));
|
2021-04-25 18:24:29 +00:00
|
|
|
|
cache.insert(pair<int, Symbol *>(0, symbol));
|
|
|
|
|
line.push_back(symbol);
|
|
|
|
|
|
|
|
|
|
symbol = new Symbol(-1, L"$", true, false);
|
|
|
|
|
table.insert(pair<wstring, Symbol *>(L"$", symbol));
|
|
|
|
|
cache.insert(pair<int, Symbol *>(-1, symbol));
|
|
|
|
|
line.push_back(symbol);
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const vector<const Symbol *> &getAllSymbols() const {
|
2021-04-25 18:24:29 +00:00
|
|
|
|
return line;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int addSymbol(const wstring& name, bool terminator) {
|
|
|
|
|
|
|
|
|
|
Symbol *symbol = nullptr;
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
if(name == L"<EFBFBD><EFBFBD>") {
|
2021-04-25 18:24:29 +00:00
|
|
|
|
return 0;
|
|
|
|
|
} else if (name[0] == L'@') {
|
|
|
|
|
symbol = new Symbol(index, name, terminator, true);
|
|
|
|
|
} else {
|
|
|
|
|
symbol = new Symbol(index, name, terminator, false);
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-24 11:53:36 +00:00
|
|
|
|
const auto &it = table.find(name);
|
2021-04-25 04:01:26 +00:00
|
|
|
|
if (it != table.end()) {
|
2021-04-25 18:24:29 +00:00
|
|
|
|
return it->second->index;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
table.insert(pair<wstring, Symbol *>(symbol->name, symbol));
|
|
|
|
|
cache.insert(pair<int, Symbol *>(symbol->index, symbol));
|
|
|
|
|
line.push_back(symbol);
|
|
|
|
|
|
|
|
|
|
index++;
|
|
|
|
|
|
|
|
|
|
return symbol->index;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
2021-04-25 04:01:26 +00:00
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const Symbol *getSymbol(int symbol_index) const {
|
2021-04-25 18:24:29 +00:00
|
|
|
|
const auto &it = cache.find(symbol_index);
|
|
|
|
|
if(it != cache.end()) {
|
|
|
|
|
return it->second;
|
|
|
|
|
} else {
|
|
|
|
|
throw runtime_error("symbol " + to_string(symbol_index) + " NOT Found");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] int getSymbolIndex(const wstring &name) const {
|
2021-04-25 04:01:26 +00:00
|
|
|
|
const auto &it = table.find(name);
|
|
|
|
|
if(it != table.end()) {
|
2021-04-25 18:24:29 +00:00
|
|
|
|
return it->second->index;
|
2021-04-25 04:01:26 +00:00
|
|
|
|
} else {
|
2021-04-25 18:24:29 +00:00
|
|
|
|
throw runtime_error("symbol NOT Found");
|
2021-04-25 04:01:26 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
void modifySymbol(int idx, const wstring &name, bool terminator, bool start) {
|
|
|
|
|
auto it = cache.find(idx);
|
|
|
|
|
if(it != cache.end()) {
|
|
|
|
|
auto p_sym = it->second;
|
|
|
|
|
p_sym->name = name;
|
|
|
|
|
p_sym->terminator = terminator;
|
|
|
|
|
p_sym->start = start;
|
2021-04-27 04:04:27 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const Symbol *getStartSymbol() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
for(const auto & symbol : getAllSymbols()) {
|
|
|
|
|
if(symbol->start) {
|
|
|
|
|
return symbol;
|
|
|
|
|
}
|
2021-04-27 04:04:27 +00:00
|
|
|
|
}
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
throw runtime_error("start symbol NOT Found");
|
2021-04-27 04:04:27 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
};
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD>ʽ
|
2021-04-29 10:55:04 +00:00
|
|
|
|
struct Production {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
const int index;
|
2021-04-29 10:55:04 +00:00
|
|
|
|
const int left;
|
|
|
|
|
const vector<int> right;
|
2021-04-27 04:04:27 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
Production(int index, int left, vector<int> right): index(index), left(left), right(std::move(right)) {}
|
2021-04-27 04:04:27 +00:00
|
|
|
|
|
|
|
|
|
};
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><EFBFBD><EFB7A8>Դ<EFBFBD><D4B4>
|
2021-04-29 10:55:04 +00:00
|
|
|
|
class GrammarResourcePool {
|
2021-04-25 04:01:26 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
int pdt_index = 0;
|
|
|
|
|
|
|
|
|
|
// <20><><EFBFBD>ű<EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
SymbolTable symbolTable;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD>ʽ
|
2021-04-29 10:55:04 +00:00
|
|
|
|
vector<const Production *> productions;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// FIRST<53><54><EFBFBD><EFBFBD><EFBFBD>洢<EFBFBD><E6B4A2>
|
2021-04-29 10:55:04 +00:00
|
|
|
|
map<int, const set<int> *> firsts;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// FOLLOW<4F><57><EFBFBD><EFBFBD><EFBFBD>洢<EFBFBD><E6B4A2>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
map<int, set<int> *> follows;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// ȥ<><C8A5><EFBFBD><EFBFBD>β<EFBFBD>ո<EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
static wstring& trim(wstring &&str) {
|
|
|
|
|
if (str.empty()) {
|
|
|
|
|
return str;
|
|
|
|
|
}
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
str.erase(0,str.find_first_not_of(' '));
|
|
|
|
|
str.erase(str.find_last_not_of(' ') + 1);
|
|
|
|
|
return str;
|
|
|
|
|
}
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
public:
|
|
|
|
|
|
|
|
|
|
const set<int > *FIRST(const vector<int> &symbols, int start_index) {
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD>ɼ<EFBFBD><C9BC><EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
auto *non_terminator_symbols = new set<int>();
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
for(int i = start_index; i < symbols.size(); i++) {
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
const auto p_non_term_set = FIRST(symbols[i]);
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
non_terminator_symbols->insert(p_non_term_set->begin(), p_non_term_set->end());
|
|
|
|
|
|
|
|
|
|
const auto sec_it = p_non_term_set->find(0);
|
|
|
|
|
if(sec_it != p_non_term_set->end()) {
|
|
|
|
|
continue;
|
|
|
|
|
} else {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return non_terminator_symbols;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
const set<int>* FIRST(int symbol) {
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD>һ<EFBFBD><D2BB><EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
const auto it = firsts.find(symbol);
|
|
|
|
|
if(it != firsts.end()) {
|
|
|
|
|
return it->second;
|
|
|
|
|
}
|
2021-04-25 04:01:26 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD>ɼ<EFBFBD><C9BC><EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
auto *non_terminator_symbols = new set<int>();
|
2021-04-25 04:01:26 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ս<EFBFBD><D5BD><EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
if(symbolTable.getSymbol(symbol)->terminator) {
|
|
|
|
|
non_terminator_symbols->insert(symbol);
|
|
|
|
|
} else {
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
bool production_found = false;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD>ÿһ<C3BF><D2BB><EFBFBD><EFBFBD>ʽ
|
2021-04-25 18:24:29 +00:00
|
|
|
|
for (const auto &production : productions) {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
const Production *p_pdt = production;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
if (p_pdt->left != symbol) continue;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
production_found = true;
|
|
|
|
|
|
|
|
|
|
for (const auto &right_symbol : p_pdt->right) {
|
|
|
|
|
|
|
|
|
|
const auto p_non_term_set = FIRST(right_symbol);
|
|
|
|
|
|
|
|
|
|
non_terminator_symbols->insert(p_non_term_set->begin(), p_non_term_set->end());
|
|
|
|
|
|
|
|
|
|
const auto sec_it = p_non_term_set->find(0);
|
|
|
|
|
|
|
|
|
|
if(sec_it != p_non_term_set->end()) {
|
|
|
|
|
continue;
|
|
|
|
|
} else {
|
|
|
|
|
break;
|
|
|
|
|
}
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
|
|
|
|
if (!production_found) non_terminator_symbols->insert(0);
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
this->firsts.insert(pair<int, const set<int> *>(symbol, non_terminator_symbols));
|
2021-04-25 04:01:26 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
return non_terminator_symbols;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
2021-04-25 04:01:26 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
const set<int> *FOLLOW(int symbol) {
|
|
|
|
|
if(follows.empty()) {
|
|
|
|
|
FOLLOW();
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
const auto it = follows.find(symbol);
|
|
|
|
|
if(it != follows.end()) {
|
|
|
|
|
return it->second;
|
|
|
|
|
} else {
|
|
|
|
|
throw runtime_error("symbol NOT Found");
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
void FOLLOW() {
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
for (const auto &symbol : symbolTable.getAllSymbols()) {
|
|
|
|
|
if (!symbol->terminator) {
|
|
|
|
|
if (symbol->start) {
|
|
|
|
|
set<int> *non_terminator_symbols = get_follow_set(symbol->index);
|
|
|
|
|
non_terminator_symbols->insert(-1);
|
|
|
|
|
}
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// ָ<><D6B8>û<EFBFBD><C3BB><EFBFBD>µķ<C2B5><C4B7>ű<EFBFBD><C5B1><EFBFBD><EFBFBD>ӵ<EFBFBD><D3B5><EFBFBD><EFBFBD><EFBFBD>FOLLOW<4F><57><EFBFBD><EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
bool ifAdded = true;
|
|
|
|
|
|
|
|
|
|
while(ifAdded) {
|
|
|
|
|
|
|
|
|
|
ifAdded = false;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
set<int> *non_terminator_symbols = nullptr;
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
for (const auto &production : productions) {
|
|
|
|
|
|
|
|
|
|
const auto &right_symbols = production->right;
|
|
|
|
|
|
|
|
|
|
set<int> equal_left_non_terminators;
|
|
|
|
|
|
|
|
|
|
for (int i = 0; i < right_symbols.size() - 1; i++) {
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD>ս<EFBFBD><D5BD><EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
if (!symbolTable.getSymbol(right_symbols[i])->terminator) {
|
|
|
|
|
|
|
|
|
|
const auto p_non_term_set = FIRST(right_symbols, i + 1);
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD>FOLLOW<4F><57>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
non_terminator_symbols = get_follow_set(right_symbols[i]);
|
|
|
|
|
|
|
|
|
|
const size_t set_size = non_terminator_symbols->size();
|
|
|
|
|
|
|
|
|
|
non_terminator_symbols->insert(p_non_term_set->begin(), p_non_term_set->end());
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20>ڼ<EFBFBD><DABC><EFBFBD><EFBFBD>з<EFBFBD><D0B7>ֿ<EFBFBD><D6BF>ַ<EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
if(non_terminator_symbols->find(0) != non_terminator_symbols->end()) {
|
|
|
|
|
non_terminator_symbols->erase(0);
|
|
|
|
|
equal_left_non_terminators.insert(right_symbols[i]);
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD><EFBFBD>Ƿ<EFBFBD><C7B7><EFBFBD><EFBFBD>µ<EFBFBD><C2B5>ս<EFBFBD><D5BD><EFBFBD><EFBFBD>ű<EFBFBD><C5B1><EFBFBD><EFBFBD><EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
if(set_size < non_terminator_symbols->size()) {
|
|
|
|
|
ifAdded = true;
|
|
|
|
|
}
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
|
|
|
|
if(!right_symbols.empty()) {
|
|
|
|
|
if (!symbolTable.getSymbol(right_symbols[right_symbols.size() - 1])->terminator) {
|
|
|
|
|
equal_left_non_terminators.insert(right_symbols[right_symbols.size() - 1]);
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
|
|
|
|
for(const auto symbol : equal_left_non_terminators) {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>߷<EFBFBD><DFB7>ս<EFBFBD><D5BD><EFBFBD><EFBFBD><EFBFBD>FOLLOW<4F><57>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
const auto left_non_terminator_symbols = get_follow_set(production->left);
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD>FOLLOW<4F><57>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
non_terminator_symbols = get_follow_set(symbol);
|
|
|
|
|
|
|
|
|
|
const size_t set_size = non_terminator_symbols->size();
|
|
|
|
|
|
|
|
|
|
non_terminator_symbols->insert(
|
|
|
|
|
left_non_terminator_symbols->begin(),
|
|
|
|
|
left_non_terminator_symbols->end());
|
|
|
|
|
|
|
|
|
|
if(non_terminator_symbols->find(0) != non_terminator_symbols->end()) {
|
|
|
|
|
non_terminator_symbols->erase(0);
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD><EFBFBD>Ƿ<EFBFBD><C7B7><EFBFBD><EFBFBD>µ<EFBFBD><C2B5>ս<EFBFBD><D5BD><EFBFBD><EFBFBD>ű<EFBFBD><C5B1><EFBFBD><EFBFBD><EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
if(set_size < non_terminator_symbols->size()) {
|
|
|
|
|
ifAdded = true;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
|
|
|
|
set<int>* get_follow_set(int symbol) {
|
|
|
|
|
|
|
|
|
|
set<int> *non_terminator_symbols = nullptr;
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD>һ<EFBFBD><D2BB><EFBFBD>
|
2021-04-25 18:24:29 +00:00
|
|
|
|
auto it = follows.find(symbol);
|
|
|
|
|
if(it != follows.end()) {
|
|
|
|
|
non_terminator_symbols = it->second;
|
|
|
|
|
} else {
|
|
|
|
|
non_terminator_symbols = new set<int>();
|
|
|
|
|
this->follows.insert(pair<int, set<int> *>(symbol, non_terminator_symbols));
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
|
|
|
|
return non_terminator_symbols;
|
|
|
|
|
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
|
|
|
|
void print_symbols(const set<int> &symbols_index) {
|
|
|
|
|
wcout << L"{ ";
|
|
|
|
|
for(const auto & symbol_index : symbols_index) {
|
|
|
|
|
auto *p_sym = symbolTable.getSymbol(symbol_index);
|
|
|
|
|
|
|
|
|
|
if(p_sym->terminator) {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
if (p_sym->name == L"<EFBFBD><EFBFBD>") {
|
2021-04-25 18:24:29 +00:00
|
|
|
|
wcout << L" [Epsilon] ";
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
else wcout << L" \"" << p_sym->name << L"\" ";
|
|
|
|
|
} else {
|
|
|
|
|
wcout << L" " << p_sym->name << L" ";
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
wcout << L"}" << endl;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
void parse_production_string_line(const wstring &temp_line) {
|
|
|
|
|
auto middle_index = temp_line.find(L"->", 0);
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
if(middle_index == string::npos) {
|
|
|
|
|
throw runtime_error("-> NOT FOUND");
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
wstring front = trim(temp_line.substr(0, middle_index));
|
|
|
|
|
int left = symbolTable.addSymbol(front, false);
|
|
|
|
|
|
|
|
|
|
wstring back = trim(temp_line.substr(middle_index + 2, temp_line.size() - middle_index - 2));
|
|
|
|
|
|
|
|
|
|
wstringstream terminator, non_terminator;
|
|
|
|
|
vector<int> symbols;
|
|
|
|
|
bool is_terminator = false;
|
|
|
|
|
for(const auto &c : back) {
|
|
|
|
|
if (c == L'\"') {
|
|
|
|
|
if(is_terminator) {
|
|
|
|
|
symbols.push_back(symbolTable.addSymbol(trim(terminator.str()), true));
|
|
|
|
|
terminator.str(L"");
|
|
|
|
|
terminator.clear();
|
|
|
|
|
}
|
|
|
|
|
is_terminator = !is_terminator;
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
if(c == L' ' || c == L'\r') {
|
|
|
|
|
wstring temp_symbol = trim(non_terminator.str());
|
|
|
|
|
if(!temp_symbol.empty()) {
|
|
|
|
|
symbols.push_back(symbolTable.addSymbol(trim(non_terminator.str()), false));
|
|
|
|
|
non_terminator.str(L"");
|
|
|
|
|
non_terminator.clear();
|
|
|
|
|
}
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
if(is_terminator) {
|
|
|
|
|
terminator << c;
|
|
|
|
|
} else {
|
|
|
|
|
non_terminator << c;
|
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-30 05:33:22 +00:00
|
|
|
|
wstring temp_symbol = trim(non_terminator.str());
|
|
|
|
|
if(!temp_symbol.empty()) {
|
|
|
|
|
symbols.push_back(symbolTable.addSymbol(trim(non_terminator.str()), false));
|
|
|
|
|
}
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
auto p_pdt = new Production(pdt_index++, left, symbols);
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
|
|
|
|
productions.push_back(p_pdt);
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const vector<const Production *> &get_productions() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return productions;
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const Symbol *getSymbol(int symbol_index) const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return symbolTable.getSymbol(symbol_index);
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const Symbol *getStartSymbol() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return symbolTable.getStartSymbol();
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
int addSymbol(const wstring &name, bool terminator) {
|
|
|
|
|
return symbolTable.addSymbol(name, terminator);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
const Production *addProduction(int left, initializer_list<int> right) {
|
|
|
|
|
vector<int> right_vector;
|
|
|
|
|
for(int symbol : right) {
|
|
|
|
|
right_vector.push_back(symbol);
|
|
|
|
|
}
|
2021-04-30 05:33:22 +00:00
|
|
|
|
auto p_pdt = new Production(pdt_index++, left, right_vector);
|
2021-04-29 10:55:04 +00:00
|
|
|
|
productions.push_back(p_pdt);
|
|
|
|
|
return p_pdt;
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const vector<const Symbol *> &getAllSymbols() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return symbolTable.getAllSymbols();
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void modifySymbol(int index, const wstring &name, bool terminator, bool start) {
|
|
|
|
|
symbolTable.modifySymbol(index, name, terminator, start);
|
|
|
|
|
}
|
|
|
|
|
};
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><>
|
2021-04-29 10:55:04 +00:00
|
|
|
|
class Item{
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><>Ӧ<EFBFBD>IJ<EFBFBD><C4B2><EFBFBD>ʽ
|
2021-04-29 10:55:04 +00:00
|
|
|
|
const Production* const production;
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD>λ<EFBFBD><CEBB>
|
2021-04-29 10:55:04 +00:00
|
|
|
|
int dot_index = 0;
|
|
|
|
|
|
|
|
|
|
const int terminator = 0;
|
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
public:
|
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
const bool generated = false;
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
explicit Item(const Production *p_pdt, int m_terminator, bool m_generated = false)
|
|
|
|
|
: production(p_pdt), terminator(m_terminator), generated(m_generated) {}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
void set_dot_index(int m_dot_index) {
|
|
|
|
|
if(m_dot_index > production->right.size()) {
|
|
|
|
|
throw runtime_error("DOT_INDEX out of range");
|
|
|
|
|
}
|
|
|
|
|
this->dot_index = m_dot_index;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] int get_dot_index() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return dot_index;
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] int get_dot_next_symbol() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
if(get_dot_index() == production->right.size()) {
|
|
|
|
|
return 0;
|
|
|
|
|
} else {
|
|
|
|
|
return production->right[dot_index];
|
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] int get_dot_next_i_symbol(int i) const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
if(get_dot_index() + i >= production->right.size()) {
|
|
|
|
|
return 0;
|
|
|
|
|
} else {
|
|
|
|
|
return production->right[dot_index + i];
|
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] int get_terminator() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return terminator;
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const Production *get_production() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return production;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
2021-04-29 10:55:04 +00:00
|
|
|
|
};
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
class ItemCollectionManager;
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
class ItemCollection{
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
int index = 0;
|
|
|
|
|
|
|
|
|
|
map<size_t, Item *> items;
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
vector<Item *> cache;
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
|
|
|
|
GrammarResourcePool *pool;
|
|
|
|
|
|
|
|
|
|
friend ItemCollectionManager;
|
|
|
|
|
|
|
|
|
|
template <class T>
|
|
|
|
|
inline void hash_combine(std::size_t& seed, const T& v) const
|
|
|
|
|
{
|
|
|
|
|
std::hash<T> hasher;
|
|
|
|
|
seed ^= hasher(v) + 0x9e3779b9 + (seed<<6) + (seed>>2);
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
static bool compare_item_ptr(const Item* lhs, const Item* rhs)
|
|
|
|
|
{
|
|
|
|
|
if(lhs->get_production() != rhs->get_production())
|
|
|
|
|
return lhs->get_production() < rhs->get_production();
|
|
|
|
|
else if(lhs->get_dot_index() != rhs->get_dot_index())
|
|
|
|
|
return lhs->get_dot_index() < rhs->get_dot_index();
|
|
|
|
|
else
|
|
|
|
|
return lhs->get_terminator() < rhs->get_terminator();
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
public:
|
|
|
|
|
|
|
|
|
|
explicit ItemCollection(GrammarResourcePool *pool) : pool(pool) {
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const vector<Item *> &getItems() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return cache;
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] int getIndex() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return index;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
bool addItem(const Production *p_pdt, int dot_index, int terminator, bool generated = false) {
|
|
|
|
|
auto hasher = hash<int>();
|
|
|
|
|
size_t seed = hasher(reinterpret_cast<const int>(p_pdt));
|
|
|
|
|
hash_combine(seed, dot_index);
|
|
|
|
|
hash_combine(seed, terminator);
|
|
|
|
|
|
|
|
|
|
auto it = items.find(seed);
|
|
|
|
|
if(it != items.end()) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
auto *p_item = new Item(p_pdt, terminator, generated);
|
|
|
|
|
p_item->set_dot_index(dot_index);
|
|
|
|
|
items.insert(pair<size_t, Item *>(seed, p_item));
|
|
|
|
|
cache.push_back(p_item);
|
|
|
|
|
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void CLOSURE() {
|
|
|
|
|
|
|
|
|
|
bool ifAdd = true;
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
while(ifAdd) {
|
|
|
|
|
ifAdd = false;
|
|
|
|
|
|
|
|
|
|
for(const auto & item : items) {
|
|
|
|
|
int next_symbol = item.second->get_dot_next_symbol();
|
|
|
|
|
|
|
|
|
|
if(next_symbol == 0
|
|
|
|
|
|| pool->getSymbol(next_symbol)->terminator) {
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
for(auto *production : pool->get_productions()) {
|
|
|
|
|
if(production->left == next_symbol) {
|
|
|
|
|
vector<int> first_args;
|
|
|
|
|
first_args.push_back(item.second->get_dot_next_i_symbol(1));
|
|
|
|
|
first_args.push_back(item.second->get_terminator());
|
|
|
|
|
|
|
|
|
|
const auto first_set = pool->FIRST(first_args, 0);
|
|
|
|
|
for(auto terminator : *first_set) {
|
|
|
|
|
if(terminator == 0) continue;
|
|
|
|
|
if(this->addItem(production, 0, terminator, true)) {
|
|
|
|
|
ifAdd = true;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void print() const {
|
|
|
|
|
|
|
|
|
|
wcout << L"I" << index << L": ";
|
|
|
|
|
|
|
|
|
|
for(const auto item : cache) {
|
|
|
|
|
const auto *p_pdt = item->get_production();
|
|
|
|
|
int dot_index = item->get_dot_index();
|
|
|
|
|
wcout << pool->getSymbol(p_pdt->left)->name << L" -> " ;
|
|
|
|
|
int i = 0;
|
2021-04-30 05:33:22 +00:00
|
|
|
|
for(const auto &symbol_index : p_pdt->right) {
|
|
|
|
|
|
|
|
|
|
if(i > 0) wcout << " ";
|
|
|
|
|
if(i++ == dot_index) wcout << "<EFBFBD><EFBFBD>";
|
|
|
|
|
|
|
|
|
|
auto *symbol = pool->getSymbol(symbol_index);
|
|
|
|
|
|
|
|
|
|
if(!symbol->index) {
|
|
|
|
|
wcout << L"[Epsilon]";
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if(!symbol->terminator)
|
|
|
|
|
wcout << pool->getSymbol(symbol_index)->name;
|
|
|
|
|
else
|
|
|
|
|
wcout << L'"' << pool->getSymbol(symbol_index)->name << L'"';
|
2021-04-29 10:55:04 +00:00
|
|
|
|
}
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
if(i++ == dot_index) wcout << "<EFBFBD><EFBFBD>";
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
wcout << L", \"" << pool->getSymbol(item->get_terminator())->name << "\"" << endl;
|
2021-04-29 10:55:04 +00:00
|
|
|
|
}
|
|
|
|
|
cout << endl;
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] size_t getHash() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
size_t seed = 0;
|
2021-04-29 12:14:20 +00:00
|
|
|
|
|
|
|
|
|
vector<Item *> cache_sorted(cache.begin(), cache.end());
|
|
|
|
|
sort(cache_sorted.begin(), cache_sorted.end(), compare_item_ptr);
|
|
|
|
|
|
|
|
|
|
for(const auto item : cache_sorted) {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
|
|
|
|
if(item->generated) {
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
hash_combine(seed, item->get_production());
|
|
|
|
|
hash_combine(seed, item->get_dot_index());
|
|
|
|
|
hash_combine(seed, item->get_terminator());
|
|
|
|
|
}
|
|
|
|
|
return seed;
|
|
|
|
|
}
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
class ItemCollectionManager{
|
|
|
|
|
|
|
|
|
|
int index = 0;
|
|
|
|
|
|
|
|
|
|
map<size_t, ItemCollection *> ic_map;
|
|
|
|
|
|
|
|
|
|
map<size_t, ItemCollection *> ic_content_map;
|
|
|
|
|
|
|
|
|
|
vector<const ItemCollection *> ics;
|
|
|
|
|
|
|
|
|
|
GrammarResourcePool *pool;
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
const Production *start_pdt{};
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
|
|
|
|
template <class T>
|
|
|
|
|
inline void hash_combine(std::size_t& seed, const T& v) const
|
|
|
|
|
{
|
|
|
|
|
std::hash<T> hasher;
|
|
|
|
|
seed ^= hasher(v) + 0x9e3779b9 + (seed<<6) + (seed>>2);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
public:
|
|
|
|
|
|
|
|
|
|
explicit ItemCollectionManager(GrammarResourcePool *resource_pool) : pool(resource_pool) {
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void buildItems() {
|
|
|
|
|
|
|
|
|
|
const auto startSymbol = pool->getStartSymbol();
|
|
|
|
|
|
|
|
|
|
wstring new_symbol_name = startSymbol->name + L"'";
|
|
|
|
|
|
|
|
|
|
int new_symbol_index = pool->addSymbol(new_symbol_name, startSymbol->terminator);
|
|
|
|
|
|
|
|
|
|
pool->modifySymbol(startSymbol->index, startSymbol->name.substr(1), false, false);
|
|
|
|
|
|
|
|
|
|
const auto *p_pdt = pool->addProduction(new_symbol_index, {startSymbol->index});
|
|
|
|
|
|
|
|
|
|
this->start_pdt = p_pdt;
|
|
|
|
|
|
|
|
|
|
auto *pi_ic = new ItemCollection(pool);
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// -1 <20><><EFBFBD><EFBFBD> $
|
2021-04-29 10:55:04 +00:00
|
|
|
|
pi_ic->addItem(p_pdt, 0, -1);
|
|
|
|
|
|
|
|
|
|
pi_ic->CLOSURE();
|
|
|
|
|
|
|
|
|
|
addItemCollection(0, 0, pi_ic);
|
|
|
|
|
|
|
|
|
|
bool ifAdd = true;
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
while(ifAdd) {
|
|
|
|
|
|
|
|
|
|
ifAdd = false;
|
|
|
|
|
const auto &r_ics = getItemCollections();
|
|
|
|
|
vector<const ItemCollection *> temp_ics(r_ics.begin(), r_ics.end());
|
|
|
|
|
for(const auto ic : temp_ics) {
|
|
|
|
|
for(const auto symbol : pool->getAllSymbols()) {
|
|
|
|
|
if(symbol->index <= 0) {
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
if(GOTO(ic, symbol->index)) {
|
|
|
|
|
ifAdd = true;
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-29 10:55:04 +00:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const Production *getStartProduction() const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return start_pdt;
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const vector<const ItemCollection *> &getItemCollections() const{
|
2021-04-29 10:55:04 +00:00
|
|
|
|
return ics;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
ItemCollection *getItemCollectionByHash(size_t hash) {
|
|
|
|
|
ItemCollection *p_ic = nullptr;
|
|
|
|
|
auto it = ic_content_map.find(hash);
|
|
|
|
|
if(it != ic_content_map.end()) {
|
|
|
|
|
p_ic = it->second;
|
|
|
|
|
}
|
|
|
|
|
return p_ic;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool addItemCollection(int idx, int symbol, ItemCollection *p_ic){
|
|
|
|
|
|
|
|
|
|
size_t ic_hash = p_ic->getHash();
|
|
|
|
|
auto it = ic_content_map.find(ic_hash);
|
|
|
|
|
if (it != ic_content_map.end()) {
|
|
|
|
|
p_ic = it->second;
|
|
|
|
|
} else {
|
|
|
|
|
p_ic->index = this->index++;
|
|
|
|
|
ic_content_map.insert(pair<size_t, ItemCollection *>(ic_hash, p_ic));
|
|
|
|
|
ics.push_back(p_ic);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
auto hasher = hash<int>();
|
|
|
|
|
size_t seed = hasher(idx);
|
|
|
|
|
hash_combine(seed, symbol);
|
|
|
|
|
|
|
|
|
|
auto it2 = ic_map.find(seed);
|
|
|
|
|
if(it2 != ic_map.end()) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
if(symbol != 0) {
|
|
|
|
|
auto p_symbol = pool->getSymbol(symbol);
|
|
|
|
|
if(p_symbol->terminator)
|
|
|
|
|
wcout << L"GOTO(" << idx << L", \"" << p_symbol->name << L"\")" << endl;
|
|
|
|
|
else
|
|
|
|
|
wcout << L"GOTO(" << idx << L", " << p_symbol->name << L")" << endl;
|
|
|
|
|
} else {
|
|
|
|
|
wcout << L"GOTO(" << idx << L", [Epsilon])" << endl;
|
|
|
|
|
}
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
|
|
|
|
ic_map.insert(pair<size_t, ItemCollection *>(seed, p_ic));
|
|
|
|
|
p_ic->print();
|
|
|
|
|
return true;
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 12:14:20 +00:00
|
|
|
|
[[nodiscard]] const ItemCollection* getGOTO(int idx, int symbol) const {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
|
|
|
|
auto hasher = hash<int>();
|
|
|
|
|
size_t seed = hasher(idx);
|
|
|
|
|
hash_combine(seed, symbol);
|
|
|
|
|
|
|
|
|
|
auto it = ic_map.find(seed);
|
|
|
|
|
if(it != ic_map.end()) {
|
|
|
|
|
return it->second;
|
|
|
|
|
} else {
|
|
|
|
|
return nullptr;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
bool GOTO(const ItemCollection *p_ic, int symbol) {
|
|
|
|
|
auto *pt_ic = new ItemCollection(pool);
|
|
|
|
|
|
|
|
|
|
for(const auto &item : p_ic->cache) {
|
|
|
|
|
if(item->get_dot_next_symbol() == symbol) {
|
|
|
|
|
pt_ic->addItem(item->get_production(), item->get_dot_index() + 1, item->get_terminator());
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
auto p_temp_ic = this->getItemCollectionByHash(pt_ic->getHash());
|
|
|
|
|
if(p_temp_ic == nullptr)
|
|
|
|
|
pt_ic->CLOSURE();
|
|
|
|
|
else pt_ic = p_temp_ic;
|
|
|
|
|
|
|
|
|
|
if(!pt_ic->items.empty()) {
|
|
|
|
|
return this->addItemCollection(p_ic->index, symbol, pt_ic);
|
|
|
|
|
} else {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
class AnalyseTableGenerator {
|
|
|
|
|
|
|
|
|
|
using Action = enum {
|
|
|
|
|
MOVE, STATUTE, ACC, STEP_GOTO
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
struct Step {
|
|
|
|
|
|
|
|
|
|
const Action action;
|
2021-04-29 12:14:20 +00:00
|
|
|
|
union Target{
|
2021-04-29 10:55:04 +00:00
|
|
|
|
int index;
|
|
|
|
|
const Production *production;
|
2021-04-29 12:14:20 +00:00
|
|
|
|
} target{};
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
|
|
|
|
Step(Action action, int index) : action(action), target(Target{index}){}
|
2021-04-29 12:14:20 +00:00
|
|
|
|
Step(Action action, const Production *p_pdt) : action(action) {
|
|
|
|
|
target.production = p_pdt;
|
|
|
|
|
}
|
2021-04-29 10:55:04 +00:00
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
map<size_t, Step *> ACTION;
|
|
|
|
|
|
|
|
|
|
map<size_t, Step *> GOTO;
|
|
|
|
|
|
|
|
|
|
const ItemCollectionManager *icm;
|
|
|
|
|
|
|
|
|
|
const GrammarResourcePool *pool;
|
|
|
|
|
|
|
|
|
|
template <class T>
|
|
|
|
|
inline void hash_combine(std::size_t& seed, const T& v) const
|
|
|
|
|
{
|
|
|
|
|
std::hash<T> hasher;
|
|
|
|
|
seed ^= hasher(v) + 0x9e3779b9 + (seed<<6) + (seed>>2);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void add_action(int index, int terminator_symbol, Action action, const Production *target_pdt) {
|
|
|
|
|
size_t seed = 0;
|
|
|
|
|
hash_combine(seed, index);
|
|
|
|
|
hash_combine(seed, terminator_symbol);
|
|
|
|
|
|
|
|
|
|
auto it = ACTION.find(seed);
|
|
|
|
|
if(it == ACTION.end()) {
|
|
|
|
|
auto step = new Step(action, target_pdt);
|
|
|
|
|
ACTION.insert(pair<size_t, Step *>(seed, step));
|
|
|
|
|
} else {
|
|
|
|
|
if(it->second->action != action || it->second->target.production != target_pdt)
|
|
|
|
|
throw runtime_error("Conflict Occurred, Syntax NOT LR(1)");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void add_action(int index, int terminator_symbol, Action action, int target_index) {
|
|
|
|
|
size_t seed = 0;
|
|
|
|
|
hash_combine(seed, index);
|
|
|
|
|
hash_combine(seed, terminator_symbol);
|
|
|
|
|
|
|
|
|
|
auto it = ACTION.find(seed);
|
|
|
|
|
if(it == ACTION.end()) {
|
|
|
|
|
auto step = new Step(action, target_index);
|
|
|
|
|
ACTION.insert(pair<size_t, Step *>(seed, step));
|
|
|
|
|
} else {
|
|
|
|
|
if(it->second->action != action || it->second->target.index != target_index)
|
|
|
|
|
throw runtime_error("Conflict Occurred, Syntax NOT LR(1)");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void add_goto(int index, int non_terminator_symbol, int target_index) {
|
|
|
|
|
size_t seed = 0;
|
|
|
|
|
hash_combine(seed, index);
|
|
|
|
|
hash_combine(seed, non_terminator_symbol);
|
|
|
|
|
|
|
|
|
|
auto it = GOTO.find(seed);
|
|
|
|
|
if(it == GOTO.end()) {
|
|
|
|
|
auto step = new Step(STEP_GOTO, target_index);
|
|
|
|
|
GOTO.insert(pair<size_t, Step *>(seed, step));
|
|
|
|
|
} else {
|
|
|
|
|
if(it->second->target.index != target_index)
|
|
|
|
|
throw runtime_error("Conflict Occurred, Syntax NOT LR(1)");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
public:
|
|
|
|
|
|
|
|
|
|
explicit AnalyseTableGenerator(const GrammarResourcePool *p_pool, const ItemCollectionManager *p_icm)
|
|
|
|
|
:pool(p_pool) , icm(p_icm) {
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void generate() {
|
|
|
|
|
const auto &ics = icm->getItemCollections();
|
|
|
|
|
for(const auto *ic : ics) {
|
|
|
|
|
for(const auto *item : ic->getItems()) {
|
|
|
|
|
if(item->get_production() == icm->getStartProduction()
|
|
|
|
|
&& item->get_dot_next_symbol() == 0
|
|
|
|
|
&& item->get_terminator() == -1) {
|
|
|
|
|
this->add_action(ic->getIndex(), -1, ACC, 0);
|
|
|
|
|
}
|
|
|
|
|
int next_symbol = item->get_dot_next_symbol();
|
|
|
|
|
if(next_symbol != 0) {
|
|
|
|
|
const auto *p_ic = icm->getGOTO(ic->getIndex(), next_symbol);
|
|
|
|
|
if(pool->getSymbol(next_symbol)->terminator) {
|
|
|
|
|
if (p_ic != nullptr) {
|
|
|
|
|
this->add_action(ic->getIndex(), next_symbol, MOVE, p_ic->getIndex());
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
if (p_ic != nullptr) {
|
|
|
|
|
this->add_goto(ic->getIndex(), next_symbol, p_ic->getIndex());
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
} else {
|
2021-04-29 13:46:57 +00:00
|
|
|
|
if(pool->getSymbol(next_symbol)->terminator) {
|
|
|
|
|
if (item->get_production()->left != pool->getStartSymbol()->index) {
|
|
|
|
|
this->add_action(ic->getIndex(), item->get_terminator(), STATUTE, item->get_production());
|
|
|
|
|
}
|
2021-04-25 18:24:29 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-29 10:55:04 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
const Step *findActionStep(int index, int terminator_symbol) {
|
|
|
|
|
size_t seed = 0;
|
|
|
|
|
hash_combine(seed, index);
|
|
|
|
|
hash_combine(seed, terminator_symbol);
|
|
|
|
|
|
|
|
|
|
auto it = ACTION.find(seed);
|
|
|
|
|
if(it != ACTION.end()) {
|
|
|
|
|
return it->second;
|
|
|
|
|
} else {
|
|
|
|
|
return nullptr;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
const Step *findGotoStep(int index, int non_terminator_symbol) {
|
|
|
|
|
size_t seed = 0;
|
|
|
|
|
hash_combine(seed, index);
|
|
|
|
|
hash_combine(seed, non_terminator_symbol);
|
|
|
|
|
|
|
|
|
|
auto it = GOTO.find(seed);
|
|
|
|
|
if (it != GOTO.end()) {
|
|
|
|
|
return it->second;
|
|
|
|
|
} else {
|
|
|
|
|
return nullptr;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
void print() {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
|
|
|
|
|
std::wofstream output("tables.txt");
|
|
|
|
|
|
|
|
|
|
size_t space = 4;
|
|
|
|
|
|
|
|
|
|
output << L"ACTION" << endl;
|
2021-04-29 10:55:04 +00:00
|
|
|
|
vector<int> symbols;
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << std::left << std::setw(space) << " ";
|
2021-04-29 10:55:04 +00:00
|
|
|
|
for(const auto *symbol : pool->getAllSymbols()) {
|
|
|
|
|
if(symbol->index == 0) continue;
|
|
|
|
|
if(symbol->terminator) {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
space = std::max(space, symbol->name.size() + 2);
|
2021-04-29 10:55:04 +00:00
|
|
|
|
symbols.push_back(symbol->index);
|
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-30 05:33:22 +00:00
|
|
|
|
|
|
|
|
|
for(const auto symbol_index : symbols) {
|
|
|
|
|
output << std::left << std::setw(space) << pool->getSymbol(symbol_index)->name;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
output << endl;
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
|
|
|
|
for(int i = 0; i < icm->getItemCollections().size(); i++){
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << std::left << std::setw(space) << i;
|
2021-04-29 10:55:04 +00:00
|
|
|
|
for(int symbol : symbols) {
|
|
|
|
|
auto p_step = this->findActionStep(i, symbol);
|
|
|
|
|
if(p_step == nullptr) {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << std::left << std::setw(space) << " ";
|
2021-04-25 18:24:29 +00:00
|
|
|
|
} else {
|
2021-04-29 10:55:04 +00:00
|
|
|
|
if(p_step->action == MOVE)
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << std::left << std::setw(space) << wstring(L"s") + to_wstring(p_step->target.index);
|
2021-04-29 10:55:04 +00:00
|
|
|
|
else if(p_step->action == ACC)
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << std::left << std::setw(space) << L"acc";
|
2021-04-29 12:14:20 +00:00
|
|
|
|
else if(p_step->action == STATUTE)
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << std::left << std::setw(space) << L"r" + to_wstring(p_step->target.production->index);
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << endl;
|
2021-04-29 13:56:09 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
}
|
2021-04-29 13:56:09 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << endl;
|
|
|
|
|
|
|
|
|
|
space = 4;
|
2021-04-29 13:56:09 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << "GOTO" << endl;
|
2021-04-29 13:56:09 +00:00
|
|
|
|
symbols.clear();
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << std::left << std::setw(space) << " ";
|
2021-04-29 13:56:09 +00:00
|
|
|
|
for(const auto *symbol : pool->getAllSymbols()) {
|
|
|
|
|
if(symbol->index == 0) continue;
|
|
|
|
|
if(!symbol->terminator && !symbol->start) {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
space = std::max(space, symbol->name.size() + 2);
|
2021-04-29 13:56:09 +00:00
|
|
|
|
symbols.push_back(symbol->index);
|
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-30 05:33:22 +00:00
|
|
|
|
|
|
|
|
|
for(const auto symbol_index : symbols) {
|
|
|
|
|
output << std::left << std::setw(space) << pool->getSymbol(symbol_index)->name;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
output <<endl;
|
2021-04-29 13:56:09 +00:00
|
|
|
|
|
|
|
|
|
for(int k = 0; k < icm->getItemCollections().size(); k++) {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << std::left << std::setw(space) << k;
|
2021-04-29 13:56:09 +00:00
|
|
|
|
for (int symbol : symbols) {
|
|
|
|
|
auto p_step = this->findGotoStep(k, symbol);
|
|
|
|
|
if(p_step == nullptr) {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << std::left << std::setw(space) << " ";
|
2021-04-29 13:56:09 +00:00
|
|
|
|
} else {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << std::left << std::setw(space) << to_wstring(p_step->target.index);
|
2021-04-29 13:56:09 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << endl;
|
2021-04-29 13:56:09 +00:00
|
|
|
|
}
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
output << endl << endl;
|
|
|
|
|
|
|
|
|
|
output.close();
|
2021-04-29 10:55:04 +00:00
|
|
|
|
}
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
};
|
|
|
|
|
|
2021-04-30 06:07:59 +00:00
|
|
|
|
class LR0Generator{
|
2021-04-29 10:55:04 +00:00
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20>ļ<EFBFBD><C4BC><EFBFBD><EFBFBD><EFBFBD>
|
2021-04-29 10:55:04 +00:00
|
|
|
|
wifstream input;
|
|
|
|
|
|
|
|
|
|
GrammarResourcePool *pool;
|
|
|
|
|
|
|
|
|
|
ItemCollectionManager *icm;
|
|
|
|
|
|
|
|
|
|
AnalyseTableGenerator *atg;
|
|
|
|
|
|
|
|
|
|
public:
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-30 06:07:59 +00:00
|
|
|
|
LR0Generator(): input("syntaxInput.txt", std::ios::binary),
|
|
|
|
|
pool(new GrammarResourcePool()),
|
|
|
|
|
icm(new ItemCollectionManager(pool)),
|
|
|
|
|
atg(new AnalyseTableGenerator(pool, icm)){
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
auto* codeCvtToUTF8= new std::codecvt_utf8<wchar_t>;
|
|
|
|
|
|
|
|
|
|
input.imbue(std::locale(input.getloc(), codeCvtToUTF8));
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-30 06:07:59 +00:00
|
|
|
|
~LR0Generator() {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
input.close();
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
void run() {
|
|
|
|
|
pool->FOLLOW();
|
|
|
|
|
icm->buildItems();
|
|
|
|
|
atg->generate();
|
|
|
|
|
atg->print();
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20>õ<EFBFBD><C3B5><EFBFBD><EFBFBD>еIJ<D0B5><C4B2><EFBFBD>ʽ
|
2021-04-29 10:55:04 +00:00
|
|
|
|
void getProductions() {
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
// <20><><EFBFBD><EFBFBD><EFBFBD>ķ<EFBFBD><C4B7>ļ<EFBFBD>
|
2021-04-29 10:55:04 +00:00
|
|
|
|
wstring temp_line;
|
|
|
|
|
|
|
|
|
|
while (getline(input, temp_line)) {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
if(temp_line.size() > 2 && temp_line[0] != '#') {
|
|
|
|
|
pool->parse_production_string_line(temp_line);
|
|
|
|
|
}
|
2021-04-24 11:53:36 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
void output(const GrammarResourcePool *&pool, const AnalyseTableGenerator *&atg) {
|
|
|
|
|
pool = this->pool;
|
|
|
|
|
atg = this->atg;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
class SyntaxParser {
|
|
|
|
|
|
|
|
|
|
// <20>ļ<EFBFBD><C4BC><EFBFBD><EFBFBD><EFBFBD>
|
|
|
|
|
wifstream input;
|
|
|
|
|
|
|
|
|
|
const GrammarResourcePool *pool;
|
|
|
|
|
|
|
|
|
|
const AnalyseTableGenerator *atg;
|
|
|
|
|
|
2021-04-30 06:07:59 +00:00
|
|
|
|
queue<int> token_queue;
|
|
|
|
|
|
|
|
|
|
vector<std::wstring> ws_split(const std::wstring& in, const std::wstring& delim) {
|
|
|
|
|
std::wregex re{ delim };
|
|
|
|
|
return std::vector<std::wstring> {
|
|
|
|
|
std::wsregex_token_iterator(in.begin(), in.end(), re, -1),
|
|
|
|
|
std::wsregex_token_iterator()
|
|
|
|
|
};
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
pair<wstring, wstring> get_token_info(const wstring &token) {
|
|
|
|
|
|
|
|
|
|
auto pre_index = token.find(L'(');
|
|
|
|
|
|
|
|
|
|
auto back_index = token.find(L')');
|
|
|
|
|
|
|
|
|
|
wstring name = token.substr(pre_index);
|
|
|
|
|
wstring value = token.substr(pre_index + 1, back_index - 1);
|
|
|
|
|
|
|
|
|
|
return pair<wstring, wstring>(name, value);
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
public:
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
SyntaxParser(const GrammarResourcePool *pool, const AnalyseTableGenerator *atg):
|
|
|
|
|
input("outputToken.txt", std::ios::binary),
|
|
|
|
|
pool(pool),
|
|
|
|
|
atg(atg){
|
|
|
|
|
|
|
|
|
|
auto* codeCvtToUTF8= new std::codecvt_utf8<wchar_t>;
|
|
|
|
|
|
|
|
|
|
input.imbue(std::locale(input.getloc(), codeCvtToUTF8));
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
~SyntaxParser() {
|
|
|
|
|
input.close();
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// <20>õ<EFBFBD><C3B5><EFBFBD><EFBFBD>еIJ<D0B5><C4B2><EFBFBD>ʽ
|
|
|
|
|
void getToken() {
|
|
|
|
|
|
|
|
|
|
// <20><><EFBFBD><EFBFBD><EFBFBD>ķ<EFBFBD><C4B7>ļ<EFBFBD>
|
|
|
|
|
wstring temp_line;
|
|
|
|
|
|
2021-04-30 06:07:59 +00:00
|
|
|
|
wstring line_index;
|
2021-04-30 05:33:22 +00:00
|
|
|
|
while (getline(input, temp_line)) {
|
|
|
|
|
if(temp_line.size() > 2 && temp_line[0] != '#') {
|
2021-04-30 06:07:59 +00:00
|
|
|
|
vector<wstring> tokens = ws_split(temp_line, L" ");
|
|
|
|
|
|
|
|
|
|
line_index = tokens[0];
|
|
|
|
|
|
|
|
|
|
for(int i = 1; i < tokens.size(); i++) {
|
|
|
|
|
auto token_info = get_token_info(tokens[i]);
|
|
|
|
|
}
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
2021-04-25 18:24:29 +00:00
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
2021-04-24 11:53:36 +00:00
|
|
|
|
int main() {
|
2021-04-30 05:33:22 +00:00
|
|
|
|
clock_t start,end;//<2F><><EFBFBD><EFBFBD>clock_t<5F><74><EFBFBD><EFBFBD>
|
|
|
|
|
start = clock(); //<2F><>ʼʱ<CABC><CAB1>
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-30 06:07:59 +00:00
|
|
|
|
const GrammarResourcePool *pool;
|
|
|
|
|
|
|
|
|
|
const AnalyseTableGenerator *atg;
|
|
|
|
|
|
2021-04-24 11:53:36 +00:00
|
|
|
|
|
2021-04-30 06:07:59 +00:00
|
|
|
|
LR0Generator generator;
|
2021-04-25 18:24:29 +00:00
|
|
|
|
|
|
|
|
|
generator.getProductions();
|
|
|
|
|
|
2021-04-29 10:55:04 +00:00
|
|
|
|
generator.run();
|
2021-04-30 06:07:59 +00:00
|
|
|
|
|
|
|
|
|
generator.output(pool, atg);
|
|
|
|
|
|
2021-04-30 05:33:22 +00:00
|
|
|
|
//<2F><><EFBFBD><EFBFBD>ʱ<EFBFBD><CAB1>
|
|
|
|
|
end = clock(); //<2F><><EFBFBD><EFBFBD>ʱ<EFBFBD><CAB1>
|
2021-04-24 11:53:36 +00:00
|
|
|
|
double times = double(end-start)/CLOCKS_PER_SEC;
|
|
|
|
|
cout<<"The Run time = "<<times<<"s" << " = " <<times * 1000 <<"ms" << endl;
|
2021-04-30 06:07:59 +00:00
|
|
|
|
|
|
|
|
|
SyntaxParser syntaxParser(pool, atg);
|
|
|
|
|
|
|
|
|
|
syntaxParser.getToken();
|
|
|
|
|
|
2021-04-24 11:53:36 +00:00
|
|
|
|
return 0;
|
|
|
|
|
}
|
|
|
|
|
|