blob: afbaeaac60a39e64cfcb4781882cd38a39036e1d [file] [log] [blame]
/*
* Copyright (C) 2015 Apple Inc. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY APPLE INC. AND ITS CONTRIBUTORS ``AS IS''
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
* THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR ITS CONTRIBUTORS
* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
* THE POSSIBILITY OF SUCH DAMAGE.
*/
#include "config.h"
#include "DFACombiner.h"
#if ENABLE(CONTENT_EXTENSIONS)
#include "MutableRangeList.h"
#include <wtf/HashMap.h>
#include <wtf/HashSet.h>
namespace WebCore {
namespace ContentExtensions {
class DFAMerger {
typedef MutableRangeList<signed char, uint64_t, 128> CombinedTransitionsMutableRangeList;
enum class WhichDFA {
A,
B
};
template<WhichDFA whichDFA>
struct TargetConverter {
uint64_t convert(uint32_t target)
{
uint64_t value = 0xffffffffffffffff;
extend(value, target);
return value;
}
void extend(uint64_t& destination, uint32_t target)
{
setHalfSignature(destination, target);
}
private:
void setHalfSignature(uint64_t& signature, uint32_t value)
{
unsigned shiftAmount = (whichDFA == WhichDFA::A) ? 32 : 0;
uint64_t mask = static_cast<uint64_t>(0xffffffff) << (32 - shiftAmount);
signature = (signature & mask) | static_cast<uint64_t>(value) << shiftAmount;
}
};
public:
DFAMerger(const DFA& a, const DFA& b)
: m_dfaA(a)
, m_dfaB(b)
{
}
DFA merge()
{
if (!m_nodeMapping.isEmpty())
return m_output;
uint64_t rootSignature = signatureForIndices(m_dfaA.root, m_dfaB.root);
getOrCreateCombinedNode(rootSignature);
CombinedTransitionsMutableRangeList combinedTransitions;
while (!m_unprocessedNodes.isEmpty()) {
combinedTransitions.clear();
uint64_t unprocessedNode = m_unprocessedNodes.takeLast();
uint32_t indexA = extractIndexA(unprocessedNode);
if (indexA != invalidNodeIndex) {
const DFANode& nodeA = m_dfaA.nodes[indexA];
auto transitionsA = nodeA.transitions(m_dfaA);
TargetConverter<WhichDFA::A> converterA;
combinedTransitions.extend(transitionsA.begin(), transitionsA.end(), converterA);
}
uint32_t indexB = extractIndexB(unprocessedNode);
if (indexB != invalidNodeIndex) {
const DFANode& nodeB = m_dfaB.nodes[indexB];
auto transitionsB = nodeB.transitions(m_dfaB);
TargetConverter<WhichDFA::B> converterB;
combinedTransitions.extend(transitionsB.begin(), transitionsB.end(), converterB);
}
unsigned transitionsStart = m_output.transitionRanges.size();
for (const auto& range : combinedTransitions) {
unsigned targetNodeId = getOrCreateCombinedNode(range.data);
m_output.transitionRanges.append({ range.first, range.last });
m_output.transitionDestinations.append(targetNodeId);
}
unsigned transitionsEnd = m_output.transitionRanges.size();
unsigned transitionsLength = transitionsEnd - transitionsStart;
uint32_t sourceNodeId = m_nodeMapping.get(unprocessedNode);
DFANode& dfaSourceNode = m_output.nodes[sourceNodeId];
dfaSourceNode.setTransitions(transitionsStart, static_cast<uint8_t>(transitionsLength));
}
return m_output;
}
private:
uint32_t invalidNodeIndex = 0xffffffff;
static uint64_t signatureForIndices(uint32_t aIndex, uint32_t bIndex)
{
return static_cast<uint64_t>(aIndex) << 32 | bIndex;
}
static uint32_t extractIndexA(uint64_t signature)
{
return static_cast<uint32_t>(signature >> 32);
}
static uint32_t extractIndexB(uint64_t signature)
{
return static_cast<uint32_t>(signature);
}
uint32_t getOrCreateCombinedNode(uint64_t newNodeSignature)
{
auto addResult = m_nodeMapping.add(newNodeSignature, invalidNodeIndex);
if (!addResult.isNewEntry)
return addResult.iterator->value;
m_output.nodes.append(DFANode());
uint32_t newNodeIndex = m_output.nodes.size() - 1;
addResult.iterator->value = newNodeIndex;
m_unprocessedNodes.append(newNodeSignature);
uint32_t indexA = extractIndexA(newNodeSignature);
uint32_t indexB = extractIndexB(newNodeSignature);
HashSet<uint64_t, DefaultHash<uint64_t>::Hash, WTF::UnsignedWithZeroKeyHashTraits<uint64_t>> actions;
if (indexA != invalidNodeIndex) {
const DFANode& node = m_dfaA.nodes[indexA];
uint32_t actionsStart = node.actionsStart();
uint32_t actionsEnd = actionsStart + node.actionsLength();
for (uint32_t i = actionsStart; i < actionsEnd; ++i)
actions.add(m_dfaA.actions[i]);
}
if (indexB != invalidNodeIndex) {
const DFANode& node = m_dfaB.nodes[indexB];
uint32_t actionsStart = node.actionsStart();
uint32_t actionsEnd = actionsStart + node.actionsLength();
for (uint32_t i = actionsStart; i < actionsEnd; ++i)
actions.add(m_dfaB.actions[i]);
}
uint32_t actionsStart = m_output.actions.size();
for (uint64_t action : actions)
m_output.actions.append(action);
uint32_t actionsEnd = m_output.actions.size();
uint16_t actionsLength = static_cast<uint16_t>(actionsEnd - actionsStart);
m_output.nodes.last().setActions(actionsStart, actionsLength);
return newNodeIndex;
}
const DFA& m_dfaA;
const DFA& m_dfaB;
DFA m_output;
HashMap<uint64_t, uint32_t, DefaultHash<uint64_t>::Hash, WTF::UnsignedWithZeroKeyHashTraits<uint64_t>> m_nodeMapping;
Vector<uint64_t, 0, ContentExtensionsOverflowHandler> m_unprocessedNodes;
};
void DFACombiner::combineDFAs(unsigned minimumSize, const WTF::Function<void(DFA&&)>& handler)
{
if (m_dfas.isEmpty())
return;
for (unsigned i = m_dfas.size(); i--;) {
if (m_dfas[i].graphSize() > minimumSize) {
handler(WTFMove(m_dfas[i]));
m_dfas.remove(i);
}
}
while (!m_dfas.isEmpty()) {
if (m_dfas.size() == 1) {
handler(WTFMove(m_dfas.first()));
return;
}
DFA a = m_dfas.takeLast();
DFA b = m_dfas.takeLast();
DFAMerger dfaMerger(a, b);
DFA c = dfaMerger.merge();
if (c.graphSize() > minimumSize || m_dfas.isEmpty()) {
// Minimizing is somewhat expensive. We only do it in bulk when we reach the threshold
// to reduce the load.
c.minimize();
}
if (c.graphSize() > minimumSize)
handler(WTFMove(c));
else
m_dfas.append(c);
}
}
}
} // namespace WebCore
#endif