Skip to content

Commit

Permalink
Expanded documentation of PowersetConverter and related types/functions.
Browse files Browse the repository at this point in the history
  • Loading branch information
zezax committed Nov 5, 2023
1 parent be4c4b6 commit ab04b2d
Show file tree
Hide file tree
Showing 2 changed files with 19 additions and 3 deletions.
13 changes: 11 additions & 2 deletions quol/red/include/Powerset.h
Original file line number Diff line number Diff line change
Expand Up @@ -45,17 +45,26 @@

namespace zezax::red {

// This is a mapping from a distinct multi-char to a set of NFA state IDs.
// All the distinct multi-chars are put in an array at the start. The
// index into that array becomes the index into this sparse array.
typedef SparseVec<NfaIdSet> IdxToNfaIdSet;

// sometimes called translation or transition table...
// This is sometimes called the translation or transition table. It maps
// sets of NFA states to the mapping described above.
typedef std::unordered_map<NfaIdSet, IdxToNfaIdSet> NfaStatesToTransitions;

// Here we keep track of how many times each accepting state occurs in
// the translation table. This is used as a tie-breaker when multiple
// accepting results are possible; the lowest number wins.
typedef std::unordered_map<NfaId, size_t> NfaIdToCount;

// NfaStatesToId keeps the mapping from sets of NFA states to the
// corresponding DFA state, by ID. Final conversion uses this.
typedef std::unordered_map<NfaIdSet, DfaId> NfaStatesToId;


// converts nfa to dfa via rabin-scott
// Main class that converts NFA to DFA via Rabin-Scott
class PowersetConverter {
public:
explicit PowersetConverter(const NfaObj &input,
Expand Down
9 changes: 8 additions & 1 deletion quol/red/lib/Powerset.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -39,6 +39,7 @@ using std::vector;

namespace {

// Picks the best from a set of NFA states, or -1 if no acceptances
Result getResult(const NfaIdSet &nis,
const NfaIdToCount &counts,
const NfaObj &nfa) {
Expand All @@ -63,6 +64,7 @@ Result getResult(const NfaIdSet &nis,

///////////////////////////////////////////////////////////////////////////////

// The main driver function for the NFA to DFA conversion
DfaObj PowersetConverter::convert() {
if (stats_)
stats_->preDfa_ = std::chrono::steady_clock::now();
Expand Down Expand Up @@ -116,6 +118,7 @@ DfaObj PowersetConverter::convert() {
}


// Doorway function to recursive transcription to final DFA
DfaId PowersetConverter::dfaFromNfa(const std::vector<MultiChar> &multiChars,
const NfaStatesToTransitions &table,
const NfaIdToCount &counts,
Expand Down Expand Up @@ -172,7 +175,9 @@ MultiCharSet basisMultiChars(const MultiCharSet &mcs) {
}


// this is a performace-critical function
// Make the translation table that the entire conversion process depends
// on. Map sets of NFA states to maps from multi-chars to NFA state sets.
// This is a performace-critical function.
NfaStatesToTransitions makeTable(NfaId initial,
const NfaObj &nfa,
const vector<MultiChar> &allMultiChars) {
Expand Down Expand Up @@ -212,6 +217,7 @@ NfaStatesToTransitions makeTable(NfaId initial,
}


// Sum all the occurrences of each accepting state in the translation table
NfaIdToCount countAcceptingStates(const NfaStatesToTransitions &table,
const NfaObj &nfa) {
NfaIdToCount rv;
Expand All @@ -225,6 +231,7 @@ NfaIdToCount countAcceptingStates(const NfaStatesToTransitions &table,
}


// The real work of building the DFA from the translation table, counts, etc.
DfaId dfaFromNfaRecurse(const vector<MultiChar> &multiChars,
const NfaStatesToTransitions &table,
const NfaIdToCount &counts,
Expand Down

0 comments on commit ab04b2d

Please sign in to comment.