| /* |
| * Copyright (C) 2016 Apple Inc. All rights reserved. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions |
| * are met: |
| * 1. Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * 2. Redistributions in binary form must reproduce the above copyright |
| * notice, this list of conditions and the following disclaimer in the |
| * documentation and/or other materials provided with the distribution. |
| * |
| * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY |
| * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR |
| * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR |
| * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
| * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
| * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
| * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY |
| * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| */ |
| |
| #include "config.h" |
| #include "B3InferSwitches.h" |
| |
| #if ENABLE(B3_JIT) |
| |
| #include "B3BasicBlockInlines.h" |
| #include "B3CaseCollectionInlines.h" |
| #include "B3InsertionSetInlines.h" |
| #include "B3PhaseScope.h" |
| #include "B3ProcedureInlines.h" |
| #include "B3SwitchValue.h" |
| #include "B3UseCounts.h" |
| #include "B3ValueInlines.h" |
| #include <wtf/ListDump.h> |
| |
| namespace JSC { namespace B3 { |
| |
| namespace { |
| |
| namespace B3InferSwitchesInternal { |
| static const bool verbose = false; |
| } |
| |
| class InferSwitches { |
| public: |
| InferSwitches(Procedure& proc) |
| : m_proc(proc) |
| , m_insertionSet(proc) |
| , m_useCounts(proc) |
| { |
| } |
| |
| bool run() |
| { |
| if (B3InferSwitchesInternal::verbose) |
| dataLog("B3 before inferSwitches:\n", m_proc); |
| |
| bool changed = true; |
| bool everChanged = false; |
| while (changed) { |
| changed = false; |
| |
| if (B3InferSwitchesInternal::verbose) |
| dataLog("Performing fixpoint iteration:\n"); |
| |
| for (BasicBlock* block : m_proc) |
| changed |= attemptToMergeWithPredecessor(block); |
| |
| everChanged |= changed; |
| } |
| |
| if (everChanged) { |
| m_proc.resetReachability(); |
| m_proc.invalidateCFG(); |
| |
| m_proc.deleteOrphans(); |
| |
| if (B3InferSwitchesInternal::verbose) |
| dataLog("B3 after inferSwitches:\n", m_proc); |
| return true; |
| } |
| |
| return false; |
| } |
| |
| private: |
| bool attemptToMergeWithPredecessor(BasicBlock* block) |
| { |
| // No point in considering the root block. We also don't consider blocks with multiple |
| // predecessors, but we could handle this if we made this code a bit more general and we were |
| // not afraid of code bloat. |
| if (block->numPredecessors() != 1) |
| return false; |
| |
| SwitchDescription description = describe(block); |
| if (B3InferSwitchesInternal::verbose) |
| dataLog("Description of primary block ", *block, ": ", description, "\n"); |
| if (!description) { |
| if (B3InferSwitchesInternal::verbose) |
| dataLog(" Bailing because not switch-like.\n"); |
| return false; |
| } |
| |
| // We know that this block behaves like a switch. But we need to verify that it doesn't also |
| // perform any effects or do expensive things. We don't want to create a switch if that will |
| // make expensive things execute unconditionally. We're very conservative about how we define |
| // "expensive". |
| for (Value* value : *block) { |
| if (value->isFree()) |
| continue; |
| if (value == description.extra) |
| continue; |
| if (value == description.branch) |
| continue; |
| if (B3InferSwitchesInternal::verbose) |
| dataLog(" Bailing because of ", deepDump(m_proc, value), "\n"); |
| return false; |
| } |
| |
| BasicBlock* predecessor = block->predecessor(0); |
| SwitchDescription predecessorDescription = describe(predecessor); |
| if (B3InferSwitchesInternal::verbose) |
| dataLog(" Description of predecessor block ", *predecessor, ": ", predecessorDescription, "\n"); |
| if (!predecessorDescription) { |
| if (B3InferSwitchesInternal::verbose) |
| dataLog(" Bailing because not switch-like.\n"); |
| return false; |
| } |
| |
| // Both us and the predecessor are switch-like, but that doesn't mean that we're compatible. |
| // We may be switching on different values! |
| if (description.source != predecessorDescription.source) { |
| if (B3InferSwitchesInternal::verbose) |
| dataLog(" Bailing because sources don't match.\n"); |
| return false; |
| } |
| |
| // We expect that we are the fall-through destination of the predecessor. This is a bit of a |
| // goofy condition. If we were not the fall-through destination then our switch is probably |
| // just totally redundant and we should be getting rid of it. But we don't handle that here, |
| // yet. |
| if (predecessorDescription.fallThrough.block() != block) { |
| if (B3InferSwitchesInternal::verbose) |
| dataLog(" Bailing because fall-through of predecessor is not the primary block.\n"); |
| return false; |
| } |
| |
| // Make sure that there ain't no loops. |
| if (description.fallThrough.block() == block |
| || description.fallThrough.block() == predecessor) { |
| if (B3InferSwitchesInternal::verbose) |
| dataLog(" Bailing because of fall-through loop.\n"); |
| return false; |
| } |
| for (SwitchCase switchCase : description.cases) { |
| if (switchCase.targetBlock() == block |
| || switchCase.targetBlock() == predecessor) { |
| if (B3InferSwitchesInternal::verbose) |
| dataLog(" Bailing because of loop in primary cases.\n"); |
| return false; |
| } |
| } |
| for (SwitchCase switchCase : predecessorDescription.cases) { |
| if (switchCase.targetBlock() == block |
| || switchCase.targetBlock() == predecessor) { |
| if (B3InferSwitchesInternal::verbose) |
| dataLog(" Bailing because of loop in predecessor cases.\n"); |
| return false; |
| } |
| } |
| |
| if (B3InferSwitchesInternal::verbose) |
| dataLog(" Doing it!\n"); |
| // We're committed to doing the thing. |
| |
| // Delete the extra value from the predecessor, since that would break downstream inference |
| // on the next fixpoint iteration. We would think that this block is too expensive to merge |
| // because of the Equal or NotEqual value even though that value is dead! We know it's dead |
| // so we kill it ourselves. |
| for (Value* value : *predecessor) { |
| if (value == predecessorDescription.extra) |
| value->replaceWithNopIgnoringType(); |
| } |
| |
| // Insert all non-terminal values from our block into our predecessor. We definitely need to |
| // do this for constants. We must not do it for the extra value, since that would break |
| // downstream inference on the next fixpoint iteration. As a bonus, we don't do it for nops, |
| // so that we limit how big blocks get in this phase. |
| for (unsigned i = 0; i < block->size() - 1; ++i) { |
| Value* value = block->at(i); |
| if (value != description.extra && value->opcode() != Nop) |
| m_insertionSet.insertValue(predecessor->size() - 1, value); |
| } |
| m_insertionSet.execute(predecessor); |
| block->values().shrink(0); |
| block->appendNew<Value>(m_proc, Oops, description.branch->origin()); |
| block->removePredecessor(predecessor); |
| |
| for (BasicBlock* successorBlock : description.block->successorBlocks()) |
| successorBlock->replacePredecessor(block, predecessor); |
| |
| block->clearSuccessors(); |
| |
| SwitchValue* switchValue = predecessor->replaceLastWithNew<SwitchValue>( |
| m_proc, predecessor->last()->origin(), description.source); |
| predecessor->clearSuccessors(); |
| switchValue->setFallThrough(description.fallThrough); |
| |
| Vector<int64_t> predecessorCases; |
| for (SwitchCase switchCase : predecessorDescription.cases) { |
| switchValue->appendCase(switchCase); |
| predecessorCases.append(switchCase.caseValue()); |
| } |
| std::sort(predecessorCases.begin(), predecessorCases.end()); |
| auto isPredecessorCase = [&] (int64_t value) -> bool { |
| return !!tryBinarySearch<int64_t>( |
| predecessorCases, predecessorCases.size(), value, |
| [] (int64_t* element) -> int64_t { return *element; }); |
| }; |
| |
| for (SwitchCase switchCase : description.cases) { |
| if (!isPredecessorCase(switchCase.caseValue())) |
| switchValue->appendCase(switchCase); |
| } |
| return true; |
| } |
| |
| struct SwitchDescription { |
| SwitchDescription() |
| { |
| } |
| |
| explicit operator bool() { return !!block; } |
| |
| void dump(PrintStream& out) const |
| { |
| out.print( |
| "{block = ", pointerDump(block), |
| ", branch = ", pointerDump(branch), |
| ", extra = ", pointerDump(extra), |
| ", source = ", pointerDump(source), |
| ", cases = ", listDump(cases), |
| ", fallThrough = ", fallThrough, "}"); |
| } |
| |
| BasicBlock* block { nullptr }; |
| Value* branch { nullptr }; |
| Value* extra { nullptr }; // This is the Equal or NotEqual value, if applicable. |
| Value* source { nullptr }; |
| Vector<SwitchCase, 1> cases; |
| FrequentedBlock fallThrough; |
| }; |
| |
| SwitchDescription describe(BasicBlock* block) |
| { |
| SwitchDescription result; |
| result.block = block; |
| result.branch = block->last(); |
| |
| switch (result.branch->opcode()) { |
| case Branch: { |
| Value* predicate = result.branch->child(0); |
| FrequentedBlock taken = result.block->taken(); |
| FrequentedBlock notTaken = result.block->notTaken(); |
| bool handled = false; |
| // NOTE: This uses UseCounts that we computed before any transformation. This is fine |
| // because although we may have mutated the IR, we would not have added any new |
| // predicates. |
| if (predicate->numChildren() == 2 |
| && predicate->child(1)->hasInt() |
| && m_useCounts.numUses(predicate) == 1) { |
| switch (predicate->opcode()) { |
| case Equal: |
| result.source = predicate->child(0); |
| result.extra = predicate; |
| result.cases.append(SwitchCase(predicate->child(1)->asInt(), taken)); |
| result.fallThrough = notTaken; |
| handled = true; |
| break; |
| case NotEqual: |
| result.source = predicate->child(0); |
| result.extra = predicate; |
| result.cases.append(SwitchCase(predicate->child(1)->asInt(), notTaken)); |
| result.fallThrough = taken; |
| handled = true; |
| break; |
| default: |
| break; |
| } |
| } |
| if (handled) |
| break; |
| result.source = predicate; |
| result.cases.append(SwitchCase(0, notTaken)); |
| result.fallThrough = taken; |
| break; |
| } |
| |
| case Switch: { |
| SwitchValue* switchValue = result.branch->as<SwitchValue>(); |
| result.source = switchValue->child(0); |
| for (SwitchCase switchCase : switchValue->cases(result.block)) |
| result.cases.append(switchCase); |
| result.fallThrough = result.block->fallThrough(); |
| break; |
| } |
| |
| default: |
| result.block = nullptr; |
| result.branch = nullptr; |
| break; |
| } |
| |
| return result; |
| } |
| |
| Procedure& m_proc; |
| InsertionSet m_insertionSet; |
| UseCounts m_useCounts; |
| }; |
| |
| } // anonymous namespace |
| |
| bool inferSwitches(Procedure& proc) |
| { |
| PhaseScope phaseScope(proc, "inferSwitches"); |
| InferSwitches inferSwitches(proc); |
| return inferSwitches.run(); |
| } |
| |
| } } // namespace JSC::B3 |
| |
| #endif // ENABLE(B3_JIT) |
| |