158 lines
5.7 KiB
C++
158 lines
5.7 KiB
C++
#pragma once
|
|
#ifndef PARSODUS_LRTABLES_GENERATOR_H_YW3GIUNH
|
|
#define PARSODUS_LRTABLES_GENERATOR_H_YW3GIUNH
|
|
|
|
#include "Parsodus/grammar.h"
|
|
#include "Parsodus/util/symbols.h"
|
|
#include "Parsodus/lrtables/table.h"
|
|
|
|
#include <algorithm>
|
|
#include <cassert>
|
|
#include <memory>
|
|
#include <queue>
|
|
|
|
namespace pds {
|
|
namespace lr {
|
|
|
|
/**
|
|
* Base class for LR (and derivative) table generators (such as SLR and LALR)
|
|
* Parametrized on the type of itemset (configuration set) to be used
|
|
*
|
|
* An Itemset should support:
|
|
* - A constructor taking a single Rule, that makes this a starting rule
|
|
* - void close(const Grammar&); compute the closure
|
|
* - Itemset succ(std::string) const; compute the successor of this set, over the given symbol
|
|
* - bool operator==(const Itemset&); are these two Itemsets equal
|
|
* - bool canMerge(const Itemset&) const; Can the given Itemset be merged into this one
|
|
* - bool merge(const Itemset&); Merge the given Itemset into this one, return whether there was a change
|
|
* - bool empty() const; is this Itemset empty (== not useful)
|
|
* - std::set<std::size_t> getReduces(const Grammar&, std::string) const; get all Rule indices where a reduce should happen with given lookahead (not necessarily a set, but iterable)
|
|
* - static bool needsFollow() const; does this type of Itemset need Follow sets to work, if so the first and follow unique_ptr's of the grammar passed will be initialized
|
|
*/
|
|
template <typename Itemset>
|
|
class Generator {
|
|
public:
|
|
/**
|
|
* Constructor
|
|
*
|
|
* @param start The start symbol for the grammar
|
|
* @param g The grammar to translate
|
|
*/
|
|
Generator(const Grammar& g);
|
|
|
|
/**
|
|
* Generate an LRTable based on given grammar
|
|
*
|
|
* @returns An LR (or derivative) table for the grammar given at construction
|
|
*/
|
|
LRTable generate();
|
|
|
|
private:
|
|
Grammar m_gram;
|
|
std::shared_ptr<Rule> m_startrule;
|
|
};
|
|
|
|
template <typename Itemset>
|
|
Generator<Itemset>::Generator(const Grammar& g) : m_gram(g), m_startrule(std::make_shared<Rule>(util::EXTENDED_START, std::vector<std::string>{g.start})) {
|
|
m_gram.terminals.insert(util::EOF_PLACEHOLDER); //End of file
|
|
m_gram.variables.insert(util::EXTENDED_START); //modified start rule
|
|
m_gram.rules.push_back(m_startrule);
|
|
if (Itemset::needsFollow()) {
|
|
m_gram.first = std::make_unique<util::FirstSet>(m_gram);
|
|
m_gram.follow = std::make_unique<util::FollowSet>(m_gram, *m_gram.first);
|
|
}
|
|
}
|
|
|
|
template <typename Itemset>
|
|
LRTable Generator<Itemset>::generate() {
|
|
LRTable table;
|
|
|
|
//Start with size 1
|
|
table.act.emplace_back();
|
|
table.goto_.emplace_back();
|
|
|
|
std::vector<Itemset> itemsets;
|
|
itemsets.emplace_back(Itemset(m_startrule));
|
|
itemsets[0].close(m_gram);
|
|
|
|
std::set<std::string> symbols;
|
|
std::set_union(m_gram.terminals.begin(), m_gram.terminals.end(),
|
|
m_gram.variables.begin(), m_gram.variables.end(),
|
|
std::inserter(symbols, symbols.end()));
|
|
|
|
std::queue<std::pair<std::size_t, Itemset>> q;
|
|
q.emplace(0, itemsets[0]);
|
|
while (!q.empty()) {
|
|
auto& curP = q.front();
|
|
std::size_t curIdx = curP.first;
|
|
Itemset cur = curP.second;
|
|
q.pop();
|
|
|
|
for (const std::string& sym : symbols) {
|
|
Itemset s = cur.succ(sym);
|
|
if (s.empty())
|
|
continue;
|
|
s.close(m_gram);
|
|
|
|
std::size_t idx;
|
|
for (idx = 0; idx < itemsets.size(); idx++) {
|
|
if (itemsets[idx] == s) {
|
|
break;
|
|
} else if (itemsets[idx].canMerge(s)) {
|
|
if (itemsets[idx].merge(s)) {
|
|
q.emplace(idx, std::move(s));
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
if (idx == itemsets.size()) {
|
|
q.emplace(idx, s);
|
|
itemsets.emplace_back(std::move(s));
|
|
|
|
//Grow the table
|
|
table.act.emplace_back();
|
|
table.goto_.emplace_back();
|
|
}
|
|
|
|
if (m_gram.variables.count(sym)) {
|
|
table.goto_[curIdx][sym] = idx;
|
|
} else {
|
|
table.act[curIdx][sym] = std::make_pair(Action::SHIFT, idx);
|
|
}
|
|
|
|
}
|
|
|
|
for (std::string term : m_gram.terminals) {
|
|
//Get reduces from the itemset, add them to the table, look for conflicts
|
|
for (std::size_t rule_applied : cur.getReduces(m_gram, term)) {
|
|
if (rule_applied == m_gram.rules.size() - 1) { // The last added rule
|
|
// The extended start rule
|
|
if (term == util::EOF_PLACEHOLDER)
|
|
table.act[curIdx][term] = std::make_pair(Action::ACCEPT, 0);
|
|
} else if (table.act[curIdx].count(term)) {
|
|
if (table.act[curIdx][term].first == Action::SHIFT) {
|
|
//Shift-Reduce conflict, rapport and resolve it (TODO)
|
|
throw std::runtime_error("shift-reduce");
|
|
} else if (table.act[curIdx][term].first == Action::REDUCE
|
|
&& table.act[curIdx][term].second != rule_applied) {
|
|
//Reduce-Reduce conflict, rapport it (TODO)
|
|
throw std::runtime_error("reduce-reduce");
|
|
} else {
|
|
//Reduce using the same rule, no problem, NO-OP
|
|
}
|
|
} else {
|
|
// No conflicts
|
|
table.act[curIdx][term] = std::make_pair(Action::REDUCE, rule_applied);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return table;
|
|
}
|
|
|
|
} /* lr */
|
|
} /* pdf */
|
|
|
|
#endif /* PARSODUS_LRTABLES_GENERATOR_H_YW3GIUNH */
|