diff options
author | Alon Zakai <alonzakai@gmail.com> | 2018-11-14 13:11:05 -0800 |
---|---|---|
committer | GitHub <noreply@github.com> | 2018-11-14 13:11:05 -0800 |
commit | b79f3a48140e99ac917274bfd680217fe28ae17c (patch) | |
tree | 25c59bfdc659149a79035198994a7e1d2d394b3e /src/ir/utils.h | |
parent | 7e9f7f62d230f7ed083c0c2d425ae47dac4f513f (diff) | |
download | binaryen-b79f3a48140e99ac917274bfd680217fe28ae17c.tar.gz binaryen-b79f3a48140e99ac917274bfd680217fe28ae17c.tar.bz2 binaryen-b79f3a48140e99ac917274bfd680217fe28ae17c.zip |
ReFinalize fix (#1742)
Handle a corner case in ReFinalize, which incrementally re-types code after changes. The problem is that if we need to figure out the type of a block, we look to the last element flowing out, or to breaks with values. If there is no such last element, and the breaks are not taken - they have unreachable values - then they don't tell us the block's proper type. We asserted that in such a case the block still had a type, and didn't handle this.
To fix it, we could look on the parent to see what type would fit. However, it seem simpler to just remove untaken breaks/switches as part of ReFinalization - they carry no useful info anyhow. After removing them, if the block has no other signal of a concrete type, it can just be unreachable.
This bug existed for at least 1.5 years - I didn't look back further. I think it was noticed by the fuzzer now due to recent fuzzing improvements and optimizer improvements, as I just saw this bug found a second time.
Diffstat (limited to 'src/ir/utils.h')
-rw-r--r-- | src/ir/utils.h | 66 |
1 files changed, 52 insertions, 14 deletions
diff --git a/src/ir/utils.h b/src/ir/utils.h index 5eff0a52d..446e2c24a 100644 --- a/src/ir/utils.h +++ b/src/ir/utils.h @@ -83,13 +83,23 @@ struct ExpressionAnalyzer { static uint32_t hash(Expression* curr); }; -// Re-Finalizes all node types +// Re-Finalizes all node types. This can be run after code was modified in +// various ways that require propagating types around, and it does such an +// "incremental" update. This is done under the assumption that there is +// a valid assignment of types to apply. // This removes "unnecessary' block/if/loop types, i.e., that are added // specifically, as in // (block (result i32) (unreachable)) // vs // (block (unreachable)) // This converts to the latter form. +// This also removes un-taken branches that would be a problem for +// refinalization: if a block has been marked unreachable, and has +// branches to it with values of type unreachable, then we don't +// know the type for the block: it can't be none since the breaks +// exist, but the breaks don't declare the type, rather everything +// depends on the block. To avoid looking at the parent or something +// else, just remove such un-taken branches. struct ReFinalize : public WalkerPass<PostWalker<ReFinalize, OverriddenVisitor<ReFinalize>>> { bool isFunctionParallel() override { return true; } @@ -108,7 +118,6 @@ struct ReFinalize : public WalkerPass<PostWalker<ReFinalize, OverriddenVisitor<R return; } // do this quickly, without any validation - auto old = curr->type; // last element determines type curr->type = curr->list.back()->type; // if concrete, it doesn't matter if we have an unreachable child, and we @@ -121,14 +130,8 @@ struct ReFinalize : public WalkerPass<PostWalker<ReFinalize, OverriddenVisitor<R if (iter != breakValues.end()) { // there is a break to here auto type = iter->second; - if (type == unreachable) { - // all we have are breaks with values of type unreachable, and no - // concrete fallthrough either. we must have had an existing type, then - curr->type = old; - assert(isConcreteType(curr->type)); - } else { - curr->type = type; - } + assert(type != unreachable); // we would have removed such branches + curr->type = type; return; } } @@ -147,15 +150,24 @@ struct ReFinalize : public WalkerPass<PostWalker<ReFinalize, OverriddenVisitor<R void visitLoop(Loop* curr) { curr->finalize(); } void visitBreak(Break* curr) { curr->finalize(); - updateBreakValueType(curr->name, getValueType(curr->value)); + auto valueType = getValueType(curr->value); + if (valueType == unreachable) { + replaceUntaken(curr->value, curr->condition); + } else { + updateBreakValueType(curr->name, valueType); + } } void visitSwitch(Switch* curr) { curr->finalize(); auto valueType = getValueType(curr->value); - for (auto target : curr->targets) { - updateBreakValueType(target, valueType); + if (valueType == unreachable) { + replaceUntaken(curr->value, curr->condition); + } else { + for (auto target : curr->targets) { + updateBreakValueType(target, valueType); + } + updateBreakValueType(curr->default_, valueType); } - updateBreakValueType(curr->default_, valueType); } void visitCall(Call* curr) { curr->finalize(); } void visitCallIndirect(CallIndirect* curr) { curr->finalize(); } @@ -195,6 +207,7 @@ struct ReFinalize : public WalkerPass<PostWalker<ReFinalize, OverriddenVisitor<R void visitMemory(Memory* curr) { WASM_UNREACHABLE(); } void visitModule(Module* curr) { WASM_UNREACHABLE(); } +private: Type getValueType(Expression* value) { return value ? value->type : none; } @@ -204,6 +217,31 @@ struct ReFinalize : public WalkerPass<PostWalker<ReFinalize, OverriddenVisitor<R breakValues[name] = type; } } + + // Replace an untaken branch/switch with an unreachable value. + // A condition may also exist and may or may not be unreachable. + void replaceUntaken(Expression* value, Expression* condition) { + assert(value->type == unreachable); + auto* replacement = value; + if (condition) { + Builder builder(*getModule()); + // Even if we have + // (block + // (unreachable) + // (i32.const 1) + // ) + // we want the block type to be unreachable. That is valid as + // the value is unreachable, and necessary since the type of + // the condition did not have an impact before (the break/switch + // type was unreachable), and might not fit in. + if (isConcreteType(condition->type)) { + condition = builder.makeDrop(condition); + } + replacement = builder.makeSequence(value, condition); + assert(replacement->type); + } + replaceCurrent(replacement); + } }; // Re-finalize a single node. This is slow, if you want to refinalize |