diff options
author | Bruce He <44327446+zm2he@users.noreply.github.com> | 2023-07-19 21:52:55 +0000 |
---|---|---|
committer | GitHub <noreply@github.com> | 2023-07-19 17:52:55 -0400 |
commit | f61bf9f46addc0b6885b60b3e0f1c4ccc7e64473 (patch) | |
tree | 92dd1216ad6d3982e0f51f797b3030f8dea2ee25 /src/analysis/reaching-definitions-transfer-function.h | |
parent | a15d71f5fb4f3488e8a25071cb8813fe6045290e (diff) | |
download | binaryen-f61bf9f46addc0b6885b60b3e0f1c4ccc7e64473.tar.gz binaryen-f61bf9f46addc0b6885b60b3e0f1c4ccc7e64473.tar.bz2 binaryen-f61bf9f46addc0b6885b60b3e0f1c4ccc7e64473.zip |
Reaching Definitions Analysis for LocalGraph (#5817)
This change implements a reaching definitions analysis which is intended
to be equivalent to the information provided by LocalGraph, specifically
the Flower class of LocalGraph.
It also introduces a CRTP utility in visitor-transfer-function.h which
implements most commonly found visitor-type transfer function
functionalities. The MonotoneCFGAnalyzer is also modified to add a phase
to collect results after the analysis is solved from the final CFG
states.
Diffstat (limited to 'src/analysis/reaching-definitions-transfer-function.h')
-rw-r--r-- | src/analysis/reaching-definitions-transfer-function.h | 178 |
1 files changed, 178 insertions, 0 deletions
diff --git a/src/analysis/reaching-definitions-transfer-function.h b/src/analysis/reaching-definitions-transfer-function.h new file mode 100644 index 000000000..8d29afd12 --- /dev/null +++ b/src/analysis/reaching-definitions-transfer-function.h @@ -0,0 +1,178 @@ +#ifndef wasm_analysis_reaching_definitions_transfer_function_h +#define wasm_analysis_reaching_definitions_transfer_function_h + +#include "ir/find_all.h" +#include "ir/local-graph.h" +#include "visitor-transfer-function.h" + +namespace wasm::analysis { + +// A state contains all the "live" LocalSet instances at some particular +// point in a program. The state tracks every LocalSet instance, not just +// ones which influence a particular local index. + +// In addition to LocalSet expressions modifying a local index's value, we +// must also account for the fact that the value of a local index could be +// the default value at initialization or its value passed in as a parameter. +// As a result, we use a fictitious LocalSet object held by the transfer +// function to represent the local index obtaining its current value on +// initialization or parameter passing. + +// Each local index gets an individual fictitious LocalSet, because the state +// tracks all local indices, and setting one local index should not affect the +// initial value of another. + +// When collecting results, the transfer function takes the states and converts +// it into a map of LocalGets to LocalSets which affect it. The fictitious +// inital value LocalSetes will be converted to nullptrs. + +class ReachingDefinitionsTransferFunction + : public VisitorTransferFunc<ReachingDefinitionsTransferFunction, + FinitePowersetLattice<LocalSet*>, + AnalysisDirection::Forward> { + + // Number of locals in the function. + size_t numLocals; + + // Maps a local index to a list of LocalSets that modify the index's value. + // The most common case is to have a single set; after that, to be a phi of 2 + // items, so we use a small set of size 2 to avoid allocations there. + std::unordered_map<Index, SmallVector<LocalSet*, 2>> indexSetses; + + // LocalGraph members we need to update. + LocalGraph::GetSetses& getSetses; + + // Fictitious LocalSet objects to reprsent a local index obtaining its value + // from its default initial value or parameter value. + std::vector<LocalSet> fakeInitialValueSetses; + + // Pointers to the fictitious LocalSet objects. + std::unordered_set<LocalSet*> fakeSetPtrs; + + // Helper function which creates fictitious LocalSetses for a function, + // inserts them into fakeInitialValueSetses and fakeSetPtrs. It returns a + // vector of actual LocalSetses in the function and fictitious LocalSetses for + // use when instatitating the lattice. + static std::vector<LocalSet*> + listLocalSetses(Function* func, + std::vector<LocalSet>& fakeInitialValueSetses, + std::unordered_set<LocalSet*>& fakeSetPtrs) { + // Create a fictitious LocalSet for each local index. + for (Index i = 0; i < func->getNumLocals(); ++i) { + LocalSet currSet; + currSet.index = i; + fakeInitialValueSetses.push_back(currSet); + } + + // Find all actual LocalSetses. + FindAll<LocalSet> setFinder(func->body); + std::vector<LocalSet*> setsesList = std::move(setFinder.list); + + // Take a pointer for each fictitious LocalSet. + for (size_t i = 0; i < fakeInitialValueSetses.size(); ++i) { + setsesList.push_back(&fakeInitialValueSetses[i]); + fakeSetPtrs.insert(&fakeInitialValueSetses[i]); + } + return setsesList; + } + +public: + // Analysis lattice. Public, as the monotone analyzer may need it. + FinitePowersetLattice<LocalSet*> lattice; + + // We actually don't update LocalGraph::Locations right now since the CFG we + // are working with doesn't contain the correct Expression**s, but this is + // left in for future improvements. TODO. + ReachingDefinitionsTransferFunction(Function* func, + LocalGraph::GetSetses& getSetses, + LocalGraph::Locations& locations) + : numLocals(func->getNumLocals()), getSetses(getSetses), + lattice(listLocalSetses(func, fakeInitialValueSetses, fakeSetPtrs)) { + + // Map every local index to a set of all the local sets which affect it. + for (auto it = lattice.membersBegin(); it != lattice.membersEnd(); ++it) { + indexSetses[(*it)->index].push_back(*it); + } + } + + void visitLocalSet(LocalSet* curr) { + assert(currState); + + // This is only needed to derive states when solving the analysis, and + // not for collecting results from the final states. + + // For a LocalSet, we remove all previous setses modifying its index and + // adds itself. + auto& currSetses = indexSetses[curr->index]; + for (auto setInstance : currSetses) { + lattice.remove(currState, setInstance); + } + + lattice.add(currState, curr); + } + + // Only for collecting results. For curr, collects all of the sets to curr's + // index which are present in the state (i.e. those that set index's current + // value). + void visitLocalGet(LocalGet* curr) { + assert(currState); + + // This is only to be run in the second phase where we iterate over the + // final (i.e. solved) states. Thus, only done when collectingResults is + // true. + if (collectingResults) { + auto& matchingSetses = indexSetses[curr->index]; + + for (auto setInstance : matchingSetses) { + if (lattice.exists(currState, setInstance)) { + // If a pointer to a real LocalSet, add it, otherwise add a nullptr. + if (fakeSetPtrs.find(setInstance) == fakeSetPtrs.end()) { + getSetses[curr].insert(setInstance); + } else { + getSetses[curr].insert(nullptr); + } + } + } + } + } + + // At the entry point of the function, we must set the state to signify that + // the values in each local index are from either a parameter value or their + // default initialized value. This cannot be done normally, because the + // initial state of the entry block is initialized as the bottom element, but + // no one can modify it because this block doesn't depend on any other. Hence + // the need for this function. + void + evaluateFunctionEntry(Function* func, + FinitePowersetLattice<LocalSet*>::Element& inputState) { + for (auto currSet : fakeSetPtrs) { + lattice.add(&inputState, currSet); + } + } + + void print(std::ostream& os, + const BasicBlock* cfgBlock, + FinitePowersetLattice<LocalSet*>::Element& inputState) { + os << "Intermediate States: " << std::endl; + currState = &inputState; + currState->print(os); + os << std::endl; + auto cfgIter = cfgBlock->begin(); + + // Since we don't store the intermediate states, we need to re-run the + // transfer function on all the CFG node expressions to reconstruct + // the intermediate states here. + while (cfgIter != cfgBlock->end()) { + os << ShallowExpression{*cfgIter} << std::endl; + visit(*cfgIter); + currState->print(os); + os << std::endl; + ++cfgIter; + } + currState = nullptr; + } +}; + +} // namespace wasm::analysis + +#endif // wasm_analysis_reaching_definitions_transfer_function_h |