summaryrefslogtreecommitdiff
path: root/src
diff options
context:
space:
mode:
authorAlon Zakai <azakai@google.com>2023-10-31 08:30:50 -0700
committerGitHub <noreply@github.com>2023-10-31 08:30:50 -0700
commitfad0698907a5a8e77ed3b2c30a4b832e575f65e0 (patch)
tree5773c0cd902e84cb4c3c6e8ddfeb2e9033167590 /src
parent68ba799661506160445dbe54f188b29494423964 (diff)
downloadbinaryen-fad0698907a5a8e77ed3b2c30a4b832e575f65e0.tar.gz
binaryen-fad0698907a5a8e77ed3b2c30a4b832e575f65e0.tar.bz2
binaryen-fad0698907a5a8e77ed3b2c30a4b832e575f65e0.zip
OnceReduction: Optimize bodies of trivial "once" functions (#6061)
In particular, if the body just calls another "once" function, then we can skip the early-exit logic.
Diffstat (limited to 'src')
-rw-r--r--src/passes/OnceReduction.cpp122
1 files changed, 112 insertions, 10 deletions
diff --git a/src/passes/OnceReduction.cpp b/src/passes/OnceReduction.cpp
index c1500f185..d97e19302 100644
--- a/src/passes/OnceReduction.cpp
+++ b/src/passes/OnceReduction.cpp
@@ -197,9 +197,10 @@ private:
OptInfo& optInfo;
};
-// Information in a basic block. We track relevant expressions, which are calls
-// calls to "once" functions, and writes to "once" globals.
+// Information in a basic block.
struct BlockInfo {
+ // We track relevant expressions, which are call to "once" functions, and
+ // writes to "once" globals.
std::vector<Expression*> exprs;
};
@@ -312,18 +313,16 @@ struct Optimizer
optimizeOnce(set->name);
}
} else if (auto* call = expr->dynCast<Call>()) {
- if (optInfo.onceFuncs.at(call->target).is()) {
+ auto target = call->target;
+ if (optInfo.onceFuncs.at(target).is()) {
// The global used by the "once" func is written.
assert(call->operands.empty());
- optimizeOnce(optInfo.onceFuncs.at(call->target));
+ optimizeOnce(optInfo.onceFuncs.at(target));
continue;
}
- // This is not a call to a "once" func. However, we may have inferred
- // that it definitely sets some "once" globals before it returns, and
- // we can use that information.
- for (auto globalName :
- optInfo.onceGlobalsSetInFuncs.at(call->target)) {
+ // Note as written all globals the called function is known to write.
+ for (auto globalName : optInfo.onceGlobalsSetInFuncs.at(target)) {
onceGlobalsWritten.insert(globalName);
}
} else {
@@ -439,7 +438,110 @@ struct OnceReduction : public Pass {
lastOnceGlobalsSet = currOnceGlobalsSet;
continue;
}
- return;
+ break;
+ }
+
+ // Finally, apply some optimizations to "once" functions themselves. We do
+ // this at the end to not modify them as we go, which could confuse the main
+ // part of this pass right before us.
+ optimizeOnceBodies(optInfo, module);
+ }
+
+ void optimizeOnceBodies(const OptInfo& optInfo, Module* module) {
+ // Track which "once" functions we remove the exit logic from, as we cannot
+ // create loops without exit logic, see below.
+ std::unordered_set<Name> removedExitLogic;
+
+ // Iterate deterministically on functions, as the order matters (since we
+ // make decisions based on previous actions; see below).
+ for (auto& func : module->functions) {
+ if (!optInfo.onceFuncs.at(func->name).is()) {
+ // This is not a "once" function.
+ continue;
+ }
+
+ // We optimize the case where the payload is trivial, that is where we
+ // have this:
+ //
+ // function foo() {
+ // if (!foo$once) return; // two lines of
+ // foo$once = 1; // early-exit code
+ // PAYLOAD
+ // }
+ //
+ // And PAYLOAD is simple.
+ auto* body = func->body;
+ auto& list = body->cast<Block>()->list;
+ if (list.size() == 2) {
+ // No payload at all; we don't need the early-exit code then.
+ //
+ // Note that this overlaps with SimplifyGlobals' optimization on
+ // "read-only-to-write" globals: with no payload, this global is really
+ // only read in order to write itself, and nothing more, so there is no
+ // observable behavior we need to preserve, and the global can be
+ // removed. We might as well handle this case here as well since we've
+ // done all the work up to here, and it is just one line to implement
+ // the nopping out. (And doing so here can accelerate the optimization
+ // pipeline by not needing to wait until the next SimplifyGlobals.)
+ ExpressionManipulator::nop(body);
+ continue;
+ }
+ if (list.size() != 3) {
+ // Something non-trivial; too many items for us to consider.
+ continue;
+ }
+ auto* payload = list[2];
+ if (auto* call = payload->dynCast<Call>()) {
+ if (optInfo.onceFuncs.at(call->target).is()) {
+ // All this "once" function does is call another. We do not need the
+ // early-exit logic in this one, then, because of the following
+ // reasoning. We are comparing these forms:
+ //
+ // // BEFORE
+ // function foo() {
+ // if (!foo$once) return; // two lines of
+ // foo$once = 1; // early-exit code
+ // bar();
+ // }
+ //
+ // to
+ //
+ // // AFTER
+ // function foo() {
+ // bar();
+ // }
+ //
+ // The question is whether different behavior can be observed between
+ // those two. There are two cases, when we enter foo:
+ //
+ // 1. foo has been called before. Then we early-exit in BEFORE, and
+ // in AFTER we call bar which will early-exit (since foo was
+ // called, which means bar was at least entered, which set its
+ // global; bar might be on the stack, if it called foo, so it has
+ // not necessarily fully executed - this is a tricky situation to
+ // handle in general, like recursive imports of modules in various
+ // languages - but we do know bar has been *entered*, which means
+ // the global was set).
+ // 2. foo has never been called before. In this case in BEFORE we set
+ // the global and call bar, and in AFTER we also call bar.
+ //
+ // Thus, the behavior is the same, and we can remove the early-exit
+ // lines.
+ //
+ // We must be careful of loops, however: If A calls B and B calls A,
+ // then at least one must keep the early-exit logic, or else they
+ // would infinitely loop if one is called. To avoid that, we track
+ // which functions we remove the early-exit logic from, and never
+ // remove the logic if we are calling such a function. (As a result,
+ // the order of iteration matters here, and so the outer loop in this
+ // function must be deterministic.)
+ if (!removedExitLogic.count(call->target)) {
+ ExpressionManipulator::nop(list[0]);
+ ExpressionManipulator::nop(list[1]);
+ removedExitLogic.insert(func->name);
+ }
+ }
+ }
}
}
};